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% lexsemsub.pl 

% lexsemsub . pat 

% revised March 17, 2000 

% LEXICON OF SUBSTANCES AND STRUCTURES 

2'2'2'S^2'2'2'2'2'£^^2'2'2'S^2'2'2-2'S^2-2'2'2'^9'9'9'2'2^ o o o o o o o o o o 

o o o o o o o"o o o o o o o o o o o o o o o o o o o^^^^^^^^^^^^^^^^^^^^^^^^^^^^'o'5'5'5'5'5'5'5*5 

multifile (phrase/5) . 
multifile (wdef/3) . 
unknown (_, fail ) . 

phrase ('[» , protein, [ 1 [ ' , gamma, »] 1 , ' -', aminobutyric , acid, a], 'GA 
BAA ' , r) . % ? 

phrase ('[', smallmolecule, [ • [ ' , zeta, ' ] ' , 1 , subunit] , ' [zeta]l subu 
nit 1 , r) . % ? 

phrase (116 , protein, [116 , 1 - ' , kd, fyn, ' - ' , associated, protein] , 1 116-k 
D Fyn-assGciated protein' ,r) . 

phrase (116 , protein, [116 , ' - ' , kd, protein] , 1 116 -kd protein '_, r) . 

phrase-( 3 , protein, [3 , ' - ' , kinase, 1 - 1 , akt] , ' 3-kinase-Akt 1 , r) . 

phrase (ability , affirmation, [ability, to], [] , r) . 

phrase (age, protein, [age, protein, kinases], 'AGC, r) . 

phrase (akt , protein, [akt, mutant], 'Akt mutant', r) . 

phrase (alternative, substance, [alternative , ntf] , 'alternative NTF ' ,r 

) . 

phrase (antibody , protein, [antibody, to, phosphotyrosine] , 'anti-phosp 
hotyrosine ' , r) . 

phrase (antigen, complex, [antigen, receptor] , 'antigen receptor' ,r) . 
phrase (ap, protein, [ap, ' - ' , 1] , 1 AP-1 ' , r) . 

phrase (aspargine, site, [aspargine, ' - ' , 141] , ' aspargine-141 ' , r) . 
phrase (b, cell, [b,cell], 'B cell', r) . 
phrase(b, cell, [b, cells], 'B cell 1 , r) . 

phrase(b, species , [b , lymphoblastoid, cells] , 'B lymphoblastoid cell 
s' ,r) . 

phrase (b, cell , [b, lymphoblastoid, cells] , 'B lymphoblastoid cells', r 
) . 

phrase (b7, protein, [b7 ,'-',' 1 '] , ! B7-l',r). 
phrase (bcl , protein, [bcl , ' - ' , 2] , ' Bcl-2 ' , r) . 
phrase (c, protein, [c,'-',jun] , 'c-Jun' ,r) . 
phrase(camk, protein, [camk, iv] , ' CaMK IV , r) . 
phrase (casp, protein, [casp, 1 - ' , 3] , ' caspase-3 1 , r) . 

phrase (caspase, protein, [caspase, '-', 3 , family , protease] , 'caspase-3 

family protease' ,r) . 
phrase (caspase, protein, [caspase, '-', 3 , precursor] , 'caspase-3 precur 
sor ' , r) . 

phrase (caspase, protein, [caspase, 1 - ' , 3] , ' caspase-3 * , r) . 
phrase (caspase, protein, [caspase, - , 3] , ' caspase-3 1 , r) . 
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phrase (caspase, protein, [caspase, ' - * , 6] , ' caspase-6 1 , r) . 

phrase (caspase, protein, [caspase, ' - ' , 7] , ' caspase-7 ' , r) . 

phrase (catalytic, domain, [catalytic, domain], 'catalytic domain' , 

r) . 

phrase (cleavage, site, [cleavage , site] , 'cleavage site',r) . 

phrase (cleavage, substance, [cleavage, products] , 'cleavage products', 

r) . 

phrase (cooh, substance, [cooh, '-' , terminal , fragment] , * COOH- termina 
1 fragment ' , r) . 

phrase (crk, protein, [crk, proteins] , ' crk proteins ', rO . 

phrase (crkl , complex, [crkl , ' - ' , c3g, complex] , ' crkl-c3g complex ' , r) . 

phrase (dcp, protein, [dcp, - , 1] , ' DCP-1 ' , r) . 

phrase(did, negation, [did, not], not, r) . 

phrase (ebv. species , ' Eps-tein-Barr virus', r) . 

phrase (epstein, species, [epstein, ' - ' , barr, virus] , ' Epstein-Barr vi 
rus ' , r) . - ■ - - 

phrase (familial , disease, [familial , alzheimer , ' ' ' ' , s , disease] , ' f amil 
ial Alzheimer ' ' ' ' s disease ' , r) . 

phrase (gene, gene, [gene , encoding, interleukin, '-' ,2] , 'gene encodin 
g interleukin-2 ' , r) . 

phrase (gst , protein, [gst, 1 - ' , ' fyn' , ' - * , sh2] , ' GST-Fyn-SH2 ' , r) . 
phrase (gst, protein, [gst ,'-',» fyn ','-', sh3 ] , ' GST-Fyn-SH3 ' , r) . 
phrase(gtp, complex, [gtp, exchange , of , rapl] , 1 GTP exchange of Rapl * , 
r) . 

phrase (guanidine, protein, [guanidine, nucleotide, ' - * , releasing, f ac 
tor,c3g] , 'guanidine nucleotide-releasing factor C3G' ,r) . 
phrase (guanidine, smallmolecule , [guanidine, nucleotide] , 'guanidine 
nucleotide ' , r) . 

phrase (guanosine, smallmolecule, [guanosine, triphosphate] , 'guanosin 
e triphosphate' ,r) . 

phrase (guanosine, smallmolecule, [guanosine , diphosphate] , 'guanosine 
diphosphate ' , r) . 

phrase (h4 , cell , [h4 , cell, line] , 'H4 cell line',r). 

phrase (h4 , cell , [h4 , human, neuroglioma, cells] , ' H4 , human, neuroglioma 
, cells ' , r) . 

phrase (ha, protein, [ha, ' - ' , ' [ ' , delta, ' ] ■ ,phpkb] , 'HA- [Delta] PHPK 
B ' , r) . 

phrase (hla, protein, [hla, ' - ' , dr7] , ' HLA-DR7 ' , r) . 

phrased, protein, [i, ■[', kappa, ']» ,b, • -','[* ,beta, ']'] , ■ I [ka 
ppa] B- [beta] ' , r) . 

phrase (i, protein, [i, ' [ ' , kappa, ']', b, '-','[ ' , alpha, ' ] ' ] , 'I [kap 
pa] B- [alpha] ' , r) . 

phrase (i, protein, [i, ! [ ! , kappa, ']',b], ' I [kappa] B ' , r) . 
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Ell 


phrase ( 




phrase ( 




phrase ( 




phrase ( 




agment ' 




phrase ( 




, r) . 
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phrase ( 




phrase ( 




, r) . 



ice, protein, [ice, '/' ,ced, 1 
il, gene, [il , ' - ' , 2 , gene] , 



1 ,3] , ' ICE/Ced-3 ' ,r) . 

'gene encoding interleukin-2 



il, protein, [il, , - , ,2], * interleukin-2 1 , r) . 
in, interm, [in, the, case, of] , [] , r) . 
in, state, [in, the , anergic , state] , inactive, r) . 
inducible, cell, [inducible , h4 , cell] , 'inducible H4 cellar 

interleukin, protein, [interleukin, ' - ' , 2] , r) . 
interleukin, protein, [interleukin, 3], ' interleukin-3 

interleukin, protein, [interleukin, '-', 1 , beta, converting, enzy 
nterleukin-1 beta converting enzyme' ,r). 
jurkat, cell, [jurkat, cell], ' Jurkat cell 1 , r) . 
jurkat, cell, [jurkat, cells], ' Jurkat cell 1 , rX . - = 

kif 3a, protein, [kif3a, '/ ' ,3, b] , ' KIF3A/3B 1 , r) . 
lbl, cell, [lbl, ' - > ,drf , cells], 1 LBL-DR7 cells', r). 
lbl,cell, [lbl, ' - ' ,dr7, cells] , 1 LBL-DR7 cells' , r) . 
let, protein, [let , 1 - ' , 23] , 'Let-23 1 , r) . 
may, probability, [may, be] , possible, r) . 

myc, protein, [myc, '-', p70s6kd3e] , ' Myc-p70s6kD3E ' , r ) . 
myc, protein, [myc, '-', pdkl] , ' Myc-PDKl 1 , r) . 
myc, protein, [myc, ' - ' ,p70s6k] , 'Myc-p70s6k' ,r) . 
myc, protein, [myc, ' - 1 , p70s6ke389d3e] , ' Myc-p70s6kE389D3E ' , r) 



myr , protein, [myr, » - ' , akt] , 'Myr-Akt ' , r) . 

n, protein, [n, ' - ' , methyl, 1 - ' ,d, ' - ' , aspartate, receptor] , 1 N 
r) . 

n, protein, [n, ' - ' , methyl, ' - ' ,d, ' - ' , aspartate] , ' NMDA ' ) . 
native, cell, [native , h4 , cell] ,' native H4 cell',r). 
nf , protein, [nf , ■ -','[' , kappa, ' ] ■ , b] , 'NF- [kappa] B ' , r) . 
nh2, site, [nh2 ,'-', terminal] , ' NH2 -terminal ', r) . 
nh2 , substance, [nh2 , * -', terminal , fragment] , ' NH2 -terminal fr 
,r) . 

nih, cell, [nih, '-', 3, t3, fibroblasts] , 'NIH-3T3 fibroblasts' 

nih,cell, [nih, '-• , '3t3' , fibroblasts] , 'NIH-3T3 fibroblasts' 

normal , substance, [normal, ntf] , 'normal NTF ' , r ) . 
nuclear, protein, [nuclear, factor, kappa, b] , 1 NF- [kappa] B ' 



phrase (plSOGlued, protein, [plSOGlued, - , arpl] , ' pl50Glued-Arpl ' , r) . 
phrase (phosphate , phosphorylate2 , [phosphate , incorporated , into] , 
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phosphorylate , r) . 

phrase (phosphatidylinositol , smallmolecule , [phosphatidylinositol , 1 
# , , , /4, , , , / 5,'- ! , triphosphate] , 'phosphatidylinositol 1,4,5-tripho 
sphate ' , r) . 

phrase (phosphoinositide, protein, [phosphoinositide, '-' dependent, 

protein, kinase], ' PDK1 ' , r) . 
phrase (phospholipase, protein, [phospholipase , c , 1 - ' , 1] , 'phospholip 
ase C-l 1 , r) . 

phrase (poly, protein, [poly, 1 ( ■ ,adp, ' - ' ,ribose, ' ) ' polymerase] , 'poly 
(ADP-ribose) polymerase' ,r) . 

phrase (polyvinyl idene, structure, [polyvinyl idene, difluoride, memb 
ranes] , ' polyvinylidene difluoride membranes' ,r) . 
phrase (presenil in, protein, [presenilin, 1] , 'presenilin 1 ■ , r) . 
phrase (presenilin, protein, [presenilin, 2] , ' presenilin, 2 ', r) ... 
phrase (productively, state, [productively, stimulated] , active, r) . 
phrase (protein, protein, [protein, tyrosine , kinase] , 'protein tyrosi 
ne kinase ' , r) . 

phrase (protein, protein, [protein, kinase , c] , 'protein kinase C ,r) . 
phrase (ps2 , substance, [ps2 ,'-', ctf] ,' presenilin 2 COOH-terminal fra 
gment ' , r) . 

phrase (ps2 , substance, [ps2 , cleavage, fragment ] , 'presenilin 2 cleava 
ge fragment ' , r) . 

phrase (pvdf, structure, [pvdf, membranes] , 'polyvinylidene difluori 
de membranes ' , r) . 

phrase (raf, protein, [raf,' -',!], 'Raf-l', r) . 
phrase (raf , protein, [raf , ' - 1 , 1] , 'Raf-l ' , r) . 
phrase (rapl , complex, [rapl , 1 - ' , gtp] , ' Rapl-GTP ' , r) . 
phrase (requirement , need2 , [requirement, for], need,r). 
phrase (ser, smallmolecule, [ser, 19], ' Ser 19 ',r). 
phrase (ser, smallmolecule, [ser, 23], 'Ser 23', r). 

phrase (serine, substance, [serine, residues], 'serine residues', r 
) . 

phrase(src, domain, [src, homology, 2], 'Src homology 2 ' , r) . 
phrase(src, domain, [src, homology, 3], 'Src homology 3 ' , r) . 
phrase (srebp, protein, [srebp, 1] , ' sterol -regulatory element bin 
ding protein 1 ' , r) . 

phrase (srebp, protein, [srebp, 1 -', 2] , ' sterol -regulatory element bin 
ding protein 2 ' , r) . 

phrase (sterol , protein, [sterol, ' - • , regulatory, element , binding, prote 
in,l] , 1 sterol -regulatory element binding protein l',r) . 
phrase (sterol, protein, [sterol, '-' , regulatory , element , binding, prote 
in,-2] , 1 sterol -regulatory element binding protein 2',r) . 
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phrase (t, cell, [t , ' - ' , dr7] , 1 t-DR7 1 , r) . 

phrase (t, cell, [t , ' - 1 ,drt, 7 1 ,b7, ' - M] , 1 t-DR7/B7-l ' , r) . 
phrase(t, cell, [t,cell], *T cell',r). 
phrase(t, cell, [t, cells], 'T cell',r). 

phrase (t, complex, [t, ' - ' , cell , receptor] , 'T-cell receptor' , r) . 

phrase (t , cell, [t , ' - ' , dr7, cells] , ' t-DR7 cells ' , r) . 

phrase (t,cell, [t, ' - ' ,dr7, ' / ' ,b7, ' - M] , ' t-DR7/B7-l • , r) . 

phrase (t, complex, [t cell , antigen, receptor] , ■ T-cell antigen rec 

eptor 1 , r) . 

phrase (threonine , aminoacid, [threonine, 229], 'threonine 229' , r) 

phrase (transcription, protein, [transcription, factor], 'transcript 
ion factor 1 , r) . 

phrase ( trypan, smallmolecule , ' trypan blue ' , r) . 
phrase (wt, protein, [wt, akt] , 'WTAkt',r). 
. phrase (zap, protein," [zap, 1 - 1 , 70], ' ZAP- 70 1 , r) . 

phrase (zdevd, smallmolecule, [zdevd, ' - ' , f mk] , ' zDEVD-fmk' , r) . 



□ 

ss. 

m 


phrase (il, protein, [il, 1 - ' , 3] , ' interleukin- 


wdef 


(ab, complex, antibody) . 


wdef 


(actin, protein, actin) . 


ST. 


wdef 


(activated, state, active) . 




wdef 


(active, state, active). 


til 

fii 


wdef 


(ad, disease, 'Alzheimer' ' ' 's disease') . 


wdef 


(age, protein, *AGC') . 




wdef 


(akt, protein, 'AKT'). 




wdef 


(anergic , state , inactive) . 




wdef 


(anergic , state , inactive) . 




wdef 


(anergy, state , inactive) . 




wdef 


(antibody , complex, antibody) . 


O 


wdef 


(antigen, substance, antigen) . 


C3 


wdef 


(aop, protein, *Aop'). 




wdef 


(apoptosis, process, apoptosis) . 




wdef 


(bad, protein, 'BAD'). 




wdef 


(c3g, protein, ' C3G 1 ) . 




wdef 


( ' ca2 + ' , smallmolecule, 1 Ca2+ ' ) . 




wdef 


(cas, protein, ' Cas ' ) . 




wdef 


(caspase , protein, caspase) . 




wdef 


(caspase , protein, caspase) . 




wdef 


(cbl, protein, ' Cbl ' ) . 




wdef 


(ccrsrh, protein, 'CCRSrh') . 




wdef 


(cd28, protein, 'CD28'). 




wdef 


(cells, structure, cell) . 




wdef 


(cholesterol , smallmolecule , cholesterol) . 
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wdef 


(cpp32 , protein, 1 CPP32 ' ) . 




wdef 


(crkl, protein, 'CrkL'). 




wdef 


(ctf, substance, ' COOH- terminal fragment') . 




wdef 


(cytokine, smallmolecule , cytokine) . 




wdef 


(cytosol, structure, cytosol) . 




wdef 


(djnk,protein, ' D JNK ' ) . 




wdef 


(djun, protein, 'DJun'). 




wdef 


(dynamitin, protein, dynamitin) . 




wdef 


(erk, protein, 1 ERK' ) . 




wdef 


(eto, smallmolecule , 'ETO 1 ) . 




wdef 


(etoposide, smallmolecule, etoposide) . 




wdef 


(fad, disease, 'familial Alzheimer* ' ' 's disease 




wdef 


(fyn, protein, 'Fyn'). 




wdef 


(gdp, smallmolecule, 'GDP') . 




wdef 


(gelsolin, protein, gelsolin) . 




wdef 


(gpl20,protein, *gpl20 l ) . 




wdef 


(grb2, protein, 'Grb2'). 




wdef 


(gst, protein, 'glutathione S-transf erase ') . 


k "l 


wdef 


(gtp, smallmolecule, ' GTP • ) . 




wdef 


(hsp70, protein, ' HSP70 ' ) . 


~ -~ 


wdef 


(human, species, human) . 




wdef 


(ikk, protein, ' IKK' ) . 




wdef 


(inactivated, state, inactive) . 


fii 


wdef 


(inactive, state, inactive) . 




wdef 


(jnk, protein, 'JNK'). 


r "3 


wdef 


(jnk, protein, 'JNK'). 




wdef 


(jnk2, protein,' JNK2 ' ) . 




wdef 


(kap3 , protein, kap3) . 




wdef 


(kdakt, protein, ' KDAkt ' ) . 


i=? 


wdef 


(kinase, protein, kinase) . 


LI 


wdef 


(kinectin, protein, kinectin) . 




wdef 


(klc, protein, klc) . 




wdef 


(lamin, protein, lamin) . 




wdef 


(myosins , protein, myosins) . 




wdef 


(nmdar, protein, ' NMDAR ' ) . 




wdef 


(nmdar2b, protein, ' NMDAR2B ' ) . 




wdef 


(ntf, substance, ' NH2 -terminal fragment') . 




wdef 


(p70s6k, protein, p70s6k) . 




wdef 


(p78s6k, protein, p78s6k) . 




wdef 


(parp, protein, ' poly (ADP-ribose) polymerase 1 ) . 




wdef 


(pdkl , protein, ' PDK1 • ) . 




wdef 


(peptides, protein, peptide) . 




wdef 


(pkb, protein, 1 PKB ' ) . 
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wdef (pkc, protein, 'protein kinase C). 
wdef (position, site, site), 
wdef (positions, site, site) . 
wdef (protease , protein, protease) . 
wdef (psl , protein, 'presenilin 1') . 
wdef (ps2 , protein, 'presenilin 2') . 
wdef(rapl, protein, 'Rapl'). 
wdef(ras, protein, 'Ras'). 
wdef (receptors , substance, receptor) . 
wdef(rela, protein, ' RelA ' ) . 
wdef (residues , substance , residue) . 
wdef (responsive, state, active). 
wdef(s6, protein, ' S6 ' ) . 

wdef (selectively , constraint, selective) . 

wdef(serll2, site, 'Serll2'). 

wdef (serl36-,. site, 'Serl36'). 

wdef (ser32, smallmolecule , 'Ser32') . 

phrase (psl , protein 

wdef (ser36, smallmolecule, 'Ser36') . 

phrase(psl, protein, [psl , ' - ' , ctf ] , ' psl-ctf ' , r) . 

wdef (sh2 , domain, • SH2 1 ) . 

wdef (sh3 , domain, ' SH3 * ) . 

wdef (she, protein, 'She'). 

wdef (signal some, complex, signalsome) . 

wdef (sites, site, site) . 

wdef ( sos, protein, ' Sos ' ) . 

wdef (staurosporine, smallmolecule, staurosporine) . 

wdef (sts, smallmolecule, ' STS ' ) . 

wdef(tcr, complex, 'T-cell receptor'). 

wdef (tetracycline, smallmolecule, tetracycline) . 

wdef (thr229, aminoacid, 'Thr229') . 

wdef (thr308 , aminoacid, 'Thr308') . 

wdef(thr389, aminoacid, 'Thr389'). 

wdef ( threonine , aminoacid , threonine ) . 

wdef (tyrosine , aminoacid, tyrosine) . 

wdef (unresponsive, state, inactive) . 

wdef (unstimulated, state, inactive) . 

wdef (zvad, smallmolecule, ' zVAD') . 
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% lexsyn.pat 

% revised March 17, 2000 

% SYNTACTIC LEXICON FOR ACTIONS 

% Contains syntactic entries for action type words and phrases 



% synp (+Wordl , +Wordlist , +Syn) 

% synp: Wordl is first word of phrase, Wordlist is list of words i 
n phrase 

% synp: Syn is syntactic categorey 
% 

% synw (+Word, +Syn) is same as synp except there is no wordlist 
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% 

synp (account , [account , for] , v) . 

synp (account , [account , for] ,vp) . 

synp (accounted, [accounted, for] ,ved) . 

synp (accounted, [accounted, for] ,ven) . 

synp (accounting, [accounting, for] ,ving) . 

synp (accounting, [accounting, for] , n) . 

synp (accounts , [accounts , for] ,vp) . 

synp(add, [add, up] ,vp) . 

synp (add, [add, up] , v) . 

synp (added, [added, up] ,ved) . 

synp (added, [added, up] ,ven).. 

synp (adding, [adding, up] , n) . 

synp (adding, [adding, up] ,ving) . , 

synp (adds, [adds, up] ,vp) . 

synp (am, [am, a, means, of , producing] ,vp) . 

synp (am, [am, due, to] ,vp) . 

synp(are, [are, a, means, of , producing] ,vp) . 

synp (are, [are, due, to] ,vp) . 

synp(as, [as , a, result , of ] ,prep) . 

synp (attributable, [attributable , to] ,vp) . % ? 

synp (attributed, [attributed, to] ,ven) . 

synp (based, [based, on] ,ven) . 

synp (based, [based, upon] ,ven) . i 

synp (be, [be, a, means, of , producing] ,v) . 

synp (be, [be, due, to] ,v) . 

synp (because, [because, of] ,prep) . 

synp (been, [been, a, means , of , producing] ,ven) . 

synp (been, [been, due, to] ,ven) . 

synp (being, [being, a, means, of , producing] ,n) . 

synp (being, [being, a, means, of , producing] ,ving) . 



% 
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being, . [being, due, to] , n) . 
being, [being, due , to] ,ving) . 
caused, [caused, by] ,ved) . 
caused, [caused, by] ,ven) . 
convey, [convey, a, signal] ,v) . 
convey, [convey, a, signal] ,vp) . 
conveyed, [conveyed, a, signal] ,ved) . 
conveyed, [conveyed, a, signal] ,ven) . 
conveying, [conveying, a, signal] , ving) 
conveying, [conveying, a, signal] ,n) . 
conveys, [conveys, a, signal] ,vp) . 
dissociate, [dissociate, from] ,vp) . 
dissociate, [dissociate , from] ,v) . 
dissociated, [dissociated, from] ,ved) . 
dissociated, [dissociated, from] ,ven) . 
dissociated, [clissociates , from] ,vp) . 
dissociating, [dissociating, from] ,n) . 
dissociating, [dissociating, from] ,ving) 
dissociation, [dissociation, from] ,n) . 



down, [down, ' - 
down, [down, ' - 
B 

down, [down, 1 - 
down, [down, ' - 
down, [down, 1 - 
down, [down, ' - 
down, [down, 1 - 
down, [down, 1 - 



, regulate] , v) . 
, regulate] , vp) 



A down-regulates B 



A 



, regulated] ,ved) . 
, regulated] ,ven) . 
, regulates] , vp) . 
, regulating] , n) . 
, regulating] ,ving) . 
, regulation] , n) . 
due , [due , to , the , fact , that ] , ad j ) . 
due, [due, to] , ad j ) . % ? 
form, [form, complex] , v) . 
form, [form, complex] ,vp) . 
formation, [formation, of, complex] ,n) 
formed, [formed, complex] ,ved) . 
formed, [formed, complex] ,ven) . 
forming, [forming, complex] ,n) . 
forming, [forming, complex] ,ving) . 
forms, [forms, complex] ,vp) . 
had, [had, an, active, role, in] , ved) . 
had, [had, an, active, role, in] ,ven) . 
has, [has, an, active, role, in] ,vp) . 
have, [have, an, active, role, in] ,v) . 
have, [have, an, active, role, in] ,vp) . 
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synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


In, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


tn, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


In, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 


synp 


(n, 


[n, 



having, [having, an, active , role,. in] , n) . 
having, [having, an, active, role, in] ,ving) . 
is, [is, a, means, of , producing] ,vp) . 
is, [is, due, to] , vp) . 

functions, [ functions , as , a , negative , regulator , of ] ,vp) . 

function, [function, as , a, negative , regulator , of ] ,vp) . 

lead, [lead, to] , v) . 

leads, [leads, to] ,vp) . 

leading, [leading, to] ,n) . 

leading, [leading, to] ,ving ) . 

leads, [leads, to] ,vp ). 

led, [led, to] ,ved) . 

led, [led, to] ,ven) . 

may, [may , be , responsible , for] ,vp) . 

mediate, [mediate, a, signal], v) . %A mediates a signal to 

mediate, [mediate, a, signal] , vp) . ' 
mediated, [mediated, a, signal] , ved) . 
mediated, [mediated, a, signal] , ven) . 
mediates, [mediates, a, signal] , vp) . 
mediating, [mediating, a, signal] , n) . 
mediating, [mediating, a, signal] , ving) . 
mediation, [mediation, of , a, signal], n). 
, [n, 1 - ' , acetyl ate] , v) . 
, [n, ' - ' , acetylate] , vp) . 
, [n, ' - 1 , acetylated] , ved) . 
, [n, 1 - ' , acetylated] , ven) . 
, [n, ' - ' , acetyl ates] , vp) . 
, [n, ' - ' , acetylating] , n) . 
, [n, ' - 1 , acetylating] , ving) . 
, [n, 1 - 1 , acetylation] , n) . 
, [n, ' - 1 , acylate] , v) . 
, [n, ' - 1 , acylate] , vp) . 
, [n, 1 - 1 , acylated] , ved) . 
, [n, ' - ' , acylated] , ven) . 

, [n, 1 - 1 , acylates] , vp) . i 
, [n, ■ - ■ , acylating] , n) . 
, [n, 1 - ' , acylating] , ving) . 
, [n, ' - ' , acylation] , n) . 
, [n, ' - ' , glycosylate] , v) . 
/ [n, • - ■ glycosylate] , vp) . 
, [n, ' - * glycosylated] ,ved) . 
, [n, ' - * glycosylated] ,ven) . 
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synp(n, [n, 
synp(n, [n, 
synp(n, [n, 
synp (n, [n, 
synp (n, [n, 
synp (o, [o, 
synp(o, [o, 
synp (o, [o, 
synp(o / [o, 
synp (o, [o, 
synp(o, [o, 
synp(o / [o, 
synp(o, [o, 
synp (only, 
synp (prolyl , 
synp (prolyl , 
synp (prolyl , 
synp (prolyl , 
synp (prolyl , 
synp (prolyl , 
synp (prolyl , 
synp (prolyl , 
synp (result , 
synp (result , 



- 1 /glycosylates] , vp) . 
- ' /glycosylating] , n) . 
- ' /glycosylating] ,ving) . 
- ' ,glycosylation] ,n) . 
- ' , terminal /proteolysis] , n) 

- 1 /glycosylate] ,v) . 
- ' /glycosylate] ,vp) . 
- ' /glycosylated] ,ved) . 

- 1 /glycosylated] ,ven) . 
- ' /glycosylates] , vp) . 
- ■ /glycosylating] ,n) . 

- 1 / glycosylating]., ving) . 
- ■ , glycosylation] ,n) . 
[only, after], , prep) . 



[prolyl, ' - \ 4, 
[prolyl ,'-',4, 
[prolyl,.'-' f 4, 
[prolyl, ' - ' , 4, 
[prolyl, ' - ' ,4, 
[prolyl , ' - ' , 4 , 
[prolyl, ■-' ,4, 
[prolyl, 1 - 1 , 4, 
[result , from] , v) . 
[result , from] , vp) . 
synp (result, [result, in] ,v) . 
synp (result, [result, in] ,vp) . 
synp (resulted, [resulted, from] ,ved) . 

[resulted, from] ,ven) . 
[resulted, in] ,ved) . 
[resulted, in] ,ven) . 
[resulting, from] ,n) . 
[resulting, from] ,ving) 
[resulting, in] ,n) . 
synp (resulting, [resulting , in] ,ving) . 
synp (results, [results , from] ,vp) . 
synp (results, [results, in] ,vp) . 
synp(set, [set, free],v). 
synp(set, [set, free],v). 
synp(set, [set, free],ved). 
synp(set, [set, free],ved). 
synp (set, [set, free] ,ven) . 
synp(set, [set, free] ,ven) . 
synp(set, [set, free],vp). 



, hydroxylate] , v ) . 
, hydroxylate] , vp) . 
, hydroxylated] , ved ) 
, hydroxylated] ,ven ) 
, hydroxylates] ,vp) . 
, hydroxy 1 at ing] , n ) . 
, hydroxylating] ,ving 
, hydroxylation] ,n) . 



synp (resulted, 
synp (resulted, 
synp (resulted, 
synp (resulting, 
synp (resulting, 
synp (resulting, 
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set, [set, free] ,vp) . 
sets, [sets, free] ,vp) . 
sets, [sets, free] ,vp) . 
setting, [setting, free] ,n) . 
setting, [setting, free] ,n) . 
setting, [setting, free] ,ving) . 
setting, [setting, free] ,ving) . 
suppress, [suppress, activity, of] ,v) . 
suppress, [suppress, activity, of] ,vp) . 
suppressed, [suppressed, activity, of] ,ved) . 
suppressed, [suppressed, activity, of] ,ven) . 
suppresses, [suppresses, activity, of] ,vp) . 
suppressing, [suppressing, activity, of],n). 
suppressing, [suppressing, activity, of] ,ving) . 
suppression, [suppression, of , activity, of],n). 
switch, [switch, on, the, activity, of] ,vp) . 
switched, [switched, on, the, activity, of] ,ved) 
switched, [switched, on, the, activity, of] ,ved) 
switched, [switched, on, the, activity, of] ,ved) 
switched, [switched, on, the, activity, of],ved) 
switched, [switched, on, the, activity, of],ved) 
switches, [switches, on, the, activity, of] ,vp) . 



up, [up, 
up, [up, 
up, [up, 
up, [up, 
up, [up, 
up, [up, 
up, [up, 
up, [up, 



, regulate] , v) . % A up-regulates B B A 
, regulate] ,vp) . % A up-regulates B B --> A 
, regulated] , ved) . 

% A up-regulates B B --> A 



, regulated] ,ven) . 
, regulates] , vp) . 
, regulating] ,n) . 
, regulating] ,ving 
, regulation] , n) . 
was , [was , a , means , of , producing] , ved) . 
was, [was, due, to] ,ved) . 
were, [were, a, means, of , producing] ,ved 
were, [were, due, to] ,ved) . 
acetylate , v) . 
acetylate , vp) . 
acetylated, ved) . 
acetylated, ven) . 
acetylates, vp) . 
acetylating, n) . 
acetylating, ving) . 
acetylation, n) . 
activate, v) . 



A up-regulates B B --> A 
% A up-regulates B B --> A 
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synw (activate, vp) . 
synw (activated, ved) . 
synw (activated, ven) . 
synw (activates , vp) . 
synw (activating, n) . 
synw (activating, ving) . 
synw (activation, n) . 
synw (add, v) . 
synw (add, vp) . 
synw (added, ved) . 
synw (added, ven) . 
synw (adding, n) . 
synw (adding, ving) . 
synw (addition, n) . 
synw (adds , vp) . 
synw (after , prep) . 
synw (aggregate ,v) . 
synw (aggregate ,vp) . 
synw (aggregated ,ved) . 
synw (aggregated ,'ven) . 
synw (aggregates ,vp) . 
synw (aggregating , n) . 
synw (aggregating ,ving) . 
synw (aggregation , n) . 
synw (arrest, n) . 
synw (arrest , v) . 
synw (arrest , vp) . 
synw (arrested, ved) . 
synw (arrested, ven) . 
synw (arresting, n) . 
synw (arresting, ving) . 
synw (arrests , vp) . 
synw (associate, v) . 
synw (associate, vp) . 
synw (associated, ved) . 
synw (associated, ven) . 
synw (associates, vp) . 
synw (associating, n) . 
synw (associating, ving) . 
synw (association, n) . 
synw (attach ,v) . 
synw (attach, vp) . 
synw (attached ,ved) . 
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synw (attached , ven) . 

synw (attaches, vp) . 

synw (attaching ,n) . 

synw (attaching , ving) . 

synw (attachment , n) . 

synw (bind, v) . 

synw (bind, vp) . 

synw (binding, n) . 

synw (binding, ving) . 

synw (binds , vp) . 

synw (block, v) . 

synw (block, vp) . 

synw (blockage, n) . 

synw (blocked, ved) . 

synw (blocked, ven) . 

synw (blocking; n ) . 

synw (blocking, ving) . 

synw (blocks , vp) . 

synw (bound, ved) . 

synw (bound, ven) . 

synw (break, v) . 

synw (break, vp) . 

synw (breakage, n) . 
synw (breaking, n) . 
synw (breaking, ving) . 
synw (breaks, vp) . 
synw (broke, ved) . 
synw (broken, ven) . 
synw (catalyzation, n) . 
synw (catalyze , v) . 
synw (catalyze, vp) . 
synw (catalyzed, ved) . 
synw (catalyzed, ven) . 
synw (catalyzes, vp) . 
synw (catalyzing, n) . 
synw (catalyzing, ving) . 
synw (causation, n) . 
synw (cause, n) . 
synw (cause, v) . 
synw (cause , ven) . 
synw ( cause, vp) . 
synw (caused, ved) . 
synw (causes , vp) . 



Page 7 



lexsyn. pat . txt 





synw 


(causing, n) . 




synw 


(causing, ving) . 




synw 


(cleavage , n) . 




synw 


(cleave , v) . 




synw 


(cleave , vp) . 




synw 


(cleaved, ved) . 




synw 


(cleaved, ven) . 




synw 


(cleaves, vp) . 




synw 


(cleaving, n) . 




synw 


(cleaving, ving) . 




synw 


(coimmunoprecipitate ,v) . 




synw 


(coimmunoprecipitate, vp) . 




synw 


(coimmunoprecipitated , ved) . 




synw 


( c o i mmunop re cipitated , ven) . 




synw 


(coimmunoprecipitates , vp) . 




synw 


(coimmunoprecipitating ,n) . 




synw 


(coimmunoprecipitating , ving) 


□ 


synw 


(coimmunoprecipitation ,n) . 




synw 


(combination ,n) . 


Ul 


synw 


(combine ,v) . 




synw 


(combine ,vp) . 


til 


synw 


[ combined , ved) . 


C(l 
f[| 


synw 


[combined ,ven) . 




synw 


[combines, vp) . 


"ii 


synw 


[combining , n) . 


0 


synw 


[combining ,ving) . 




synw 


[conjugate , v) . 


I i 

r == 


synw 1 


[conjugate ,vp) . 


r :: s 


synw ( 


'conjugated ,ve) . 


: - 
'* = 5 


synw { 


conjugated ,ved) . 


c :r 


synw i 


conjugates , vp) . 




synw ( 


conjugating ,n) . 




synw i 


conjugating ,ving) . 




synw ( 


conjugation ,n) . 




synw ( 


connect ,vp) . 




synw I 


connect, v) . 




synw < 


connected , ve) . 




synw ( 


connected ,ved) . 




synw ( 


connecting , n) . 




synw I 


connecting ,ving) . 




synw ( 


connection ,n) . 




synw ( 


connects , vp) . 




synw (constrain, v) . 
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\ luuo l x. d_Lii ; v^jy . 






\ L LJi lo LI axiicu , V t-Ll / . 




o y iiw 


( /lAnol-ra *i n -iron ^ 




synw 


( rnn g t* i n t nn n ^ 
V v— • \*j no li o. xiij-i iy f ±1 j 




o yiiw 


{ fnnch T~ n n l Tin "\ 7" ~i n r-t ^ 

v l-luio l j_ ct ni-L ny / V iiiy / > 




Dyiiw 






o yiiw 


( r , r~^TiQt~"K~^ "i Tit" ti ^ 




o y iiw 


\ \J L> J_ CT L- X. L* 1 LuLC ( V y . 




oy iiw 


( rnnTPr i t*h h ai - p "\tt^^ 

\ WW J_ C L. X k/ X LaLC / V LJ ) . 




oy iiw 


( (-1 r~\y) ~y ci (~* -j •pji hafpH -\rp r\ \ 
\ L>Upi CUly X LuLCU f V CU J ■ 




d y iiw 


/ oor-jT*^ f"* i "o "i 1~ ^ t~ o H -irp ti \ 

CL1 LyX LuLCU , V Cll/ . 




synw 


( /"i v* d r+ i y\ i i - 3 f" r~i -r \ 
\COprcCipiL.aLcS , Vp y . 




oy iiw 


V l.lj lji t; x^x L a. L 1 iiy / II / • 




syi iw 


1 f~* f"Vr*Vr r " '*i "r'l"! "1 ' ^ f~ i inn iri TV/"* i 
\ L» UU I C L- J. X La L XI 1M ^ V 11 1LJ y . 




oyiiw 


f rnnypp i i t" 3 h i at-i T"i \ 

\ LUpX CL XpX Lu. 1 LLvil f 11/ . 




oy iiw 


\LUpUX IxlLaLXOn . 




synw 


icopui liieu , veuj . 


r ~i 


synw 


i copuiivi j_ 1 cru. , venj . 




oy IIW 


iLUpUIllXcb, vpj . 


1=1 


synw 


PATM 1 >*1 fir T7T\ ] 

^ copu.ivj_ j_ y , vp; . 




synw 


1 copuri ry , . 


H J 


synw 


k copuriiyiny ,n; . 


ni- 
ts ; s 


synw 


^opuriiying , vmy J . 


V £ 


synw 


k coupic / vp; . 




awn t*7 

oy iiw 


.LUUpic / V f . 


1=1 
c 


synw 


t coupiea , veuj . 


synw 


k coupiea, ven/ . 


jjss 


synw 


couples, vp) . 




synw 


^coupling, nj . 


f = t: 
f:sr 


oyiiw 


i coupi my ; ving j . 


f S | 


oyiiw 


^ LUL / 11 ) . 




o y iiw 


t L. LI L / V ) m 




D YIIW 1 


LUL r VCH/ • 




o y iiw 1 


/nil 4- -rrfifi I 

\— U. L f Veil J . 




synw i 


CUl , vp ; . 




synw i 


culs , vp; . 




synw i 


cut t ing , n) . 




synw i 


cuccing, vingj . 




synw i 


deactivate , v) . 




synw ( 


deactivate, vp) . 




synw ( 


deactivated, ved) . 




synw ( 


deactivated, ven) . 




synw ( 


deactivates, vp) . 
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deactivating, n) . 
deactivating, ving) . 
deactivation,^ . 
death, n) . 
demethylate, v) . 
demethylate, vp) . 
demethylated, ved) . 
demethylated, ven) . 
demethylates , vp) . 
demethylating, n) . 
demethylating, ving) . 
demethylation, n) . 
dephosphorylate, v) . 
dephosphoryiate , vp) . 
dephosphorylated, ved) . 
dephosphorylated, ven) . 
dephosphorylates, vp) . 
dephosphorylating, n) . 
dephosphorylating, ving) 
dephosphorylation, n) . 
die,v) . 
die,vp) . 
died, ved) . 
died, ven) . 
dies,vp) . 
disassemble, v) . 
disassemble, vp) . 
disassembled, ved) . 
disassembled, ven) . 
disassembles, vp) . 
disassembling, n) . 
disassembling, ving) . 
disassembly, n) . 
discharge, n) . 
discharge, v) . 
discharge, vp) . 
discharged, ved) . 
discharged, ven) . 
discharges, vp) . 
discharging, n) . 
discharging, ving) . 
disengage , v) . 
disengage , vp) . 
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(disengaged, ved) . 
(disengaged, ven) . 
(disengagement , n) . 
(disengages, vp) . 
(disengaging, n) . 
(disengaging, ving) 
(divide , v) . 
(divide, vp) . 
(divided, ved) . 
(divided, ven) . 
(divides, vp) . 
(dividing, n) . 
(dividing, ving) . 
(division, n) . 
(dying, n) . 
(dying , ving)". 
(enhance, v) . 
(enhance, vp) . 
' (enhanced, ved) . 
(enhanced, ven) . 

■ (enhancement, n) . 
(enhances, vp) . 
(enhancing, n) . 
(enhancing, ving) . 
(express, v) . 
(express, vp) . 
(expressed, ved) . 
(expressed, ved) . 
(expressed, ven) . 

■ (expresses ,vp) . 
(expressing, n) . 
(expressing, n) . 
(expressing, ving) . 
(expression, n) . 
(generate, v) . 
(generate, vp) . 
(generated, ved) . 
(generated, ven) . 
(generates, vp) . 
(generating, n) . 
(generating, ving) . 
(generation, n) . 
(hew, v) . 
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synw (hew, vp) . 
synw (hewed, ved) . 
synw (hewed, ven) . 
synw (hewing, n) . 
synw (hewing , ving) . 
synw (hews , vp) . 
synw (hinder , v) . 
synw (hinder , vp) . 
synw (hindered, ved) . 
synw (hindered, ven) . 
synw (hindering, n) . 
synw (hindering, ving) . 
synw (hinders , vp) . 
synw (hindrance , n) . 
synw (inactivate , v) . 
synw (inactivate, vp) . 
synw (inactivated, ved) . 
synw (inactivated, ven) . 
synw (inactivates , vp) . 
synw (inactivating, n) . 
synw (inactivating, ving) . 
synw (inactivat ion, n) . 
synw (incite , v) . 
synw (incite, vp) . 
synw (incited, ved) . 
synw (incited, ven) . 
synw (incitement , n) . 
synw (incites , vp) . 
synw (inciting, n) . 
synw (inciting, ving) . 
synw (induce , v) . 
synw (induce, vp) . 
synw (induced, ved) . 
synw (induced, ven) . 
synw (induces , vp) . 
synw (inducing, n) . 
synw (inducing, ving) . 
synw (induction, n) . 
synw (influence , n) . 
synw (influence , v) . 
synw (influence , vp) . 
synw (influenced, ved) . 
synw (influenced, ven) . 
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synw (influences, vp) . 

synw (influencing, n) . 

synw (influencing, ving) . % ? 

synw (inhibit , v) . 

synw (inhibit ,vp) . 

synw (inhibited, ved) . 

synw ( inhibited, ven) . 

synw (inhibiting, n) . 

synw (inhibiting, ving) . 

synw (inhibition, n) . 

synw (inhibits, vp) . 

synw (initiate, v) . 

synw (initiate, vp) . 

synw (initiated, ved) . 

synw (initiated, ven) . 

syriw (initiates, vp) . 

synw (initiating, n) . 

synw (initiating, ving) . 

synw (initiation, vp) . 

synw ( instigate , v) . 

synw (instigate, vp) . 

synw (instigated, ved) . 

synw (instigated, ven) . 
synw (instigates, vp) . 
synw (instigating, n) . 
synw (instigating, ving) . 
synw (instigation, n) . 
synw (interact ,v) . 
synw (interact , vp) . 
synw (interacted, ved) . 
synw (interacted, ven) . 
synw (interacting, n) . 
synw (interacting, ving) . 
synw ( interaction, n) . 
synw (interactions, n) . 
synw ( interacts, vp) . 
synw (join , vp) . 
synw(join,v) . 
synw (joined, ved) . 
synw (joined, ven) . 
synw (joining, n) . 
synw (joining, ving) . 
synw (joins, vp) . 
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synw (juncture , n) . 
synw (liberate , v) . 
synw (liberate , vp) . 
synw (liberated, ved) . 
synw (liberated, ven) . 
synw (liberates, vp) . 
synw (liberating, n) . 
synw (liberating, ving) . 
synw (liberation, n) . 
synw (limit , v) . 
synw (limit , vp) . 
synw (limitation, n) . 
synw (limited, ved) . 
synw (limited, ven) . 
synw (limiting, n) . 
synw (limiting, ving) . 
synw (limits, vp) . 
synw (link, n) . 
synw (link, v) . 
synw (link, vp) . 
synw (linked, ved) . 
synw (linked, ven) . 
synw (linking, n) . 
synw (linking, ving) . 
synw (links, vp) . 
synw (mediate, v) . 
synw (mediate ,vp) . 
synw (mediated, ved) . 
synw (mediated, ven) . 
synw (mediates, vp) . 
synw (mediating, n) . 
synw (mediating, ving) . 
synw (mediation, n) . 
synw (methyl ate, vp) . 
synw (methylate, v ) . 
synw (methylated, ved ) . 
synw (methylated, ven ) . 
synw (methylates , vp) . 
synw (methylating, n ) . 
synw (methyl a ting, ving ) . 
synw (methylation, n) . 
synw (modification, n) . 
synw (modified, ved) . 
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synw (modified, ven) . 
synw (modifies, vp) . 
synw (modify , v) . 
synw (modify , vp) . 
synw (modifying, n) . 
synw (modifying, ving) . 
synw (mutate , v) . 
synw (mutate, vp) . 
synw (mutated, ved) . 
synw (mutated, ven) . 
synw (mutates , vp) . 
synw (mutating, n) . 
synw (mutating, ving) . 
' synw (mutation, n) . 
synw (over express, v) . 
synw (bverexpress , vp) . 
synw (overexpressed, ved) . 
synw (overexpressed, ven) . 
synw (overexpresses , vp) . 
synw (overexpressing, n) . 
synw (overexpressing, ving) . 
synw (overexpress ion, n) . 
synw (pair, v) . 
synw (pair , vp) . 
synw (paired, ved) . 
synw (paired, ven) . 
synw (pairing, n) . 
synw (pairing, ving) . 
synw (pairs , vp) . 
synw (phosphorylate , n) . 
synw(phosphorylate, vp) . 
synw (phosphorylated, ved) . 
synw (phosphorylated, ven) . 
synw (phosphorylates , vp) . 
synw (phosphoryla ting, n) . 
synw (phosphorylating, ving) . 
synw (phosphorylation, n) . 
synw (promote, v) . 
synw (promote, vp) . 
synw (promoted, ved) . 
synw (promoted, ven) . 
synw (promotes , vp) . 
synw (promoting, n) . 
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synw (promoting, ving) . 
synw (promotion, n) . 
synw (prompt , n) . 
synw (prompt , v) . 
synw (prompt , vp) . 
synw (prompted, ved) . 
synw (prompted, ven) . 
synw (prompting, n) . 
synw (prompting, ving) . 
synw (prompts , vp) . 
synw (react , v) . 
synw (react , vp) . 
synw (reacted, ved) . 
synw (reacted, ven) . 
synw (reacting, n) . 
synw (reacting, ving) . 
synw (reaction, n) . 
synw (reacts, vp) . 
synw (regulate, v) . 
synw (regulate, vp) . 
synw (regulated, ved) . 
synw (regulated, ven) . 
synw (regulates , vp) . 
synw (regulating, n) . . 
synw (regulating, ving) . 
synw (regulation, n) . 
synw (release, n) . 
synw (release, v) . 
synw (release , vp) . 
synw (released, ved) . 
synw (released, ven) . 
synw (releases, vp) . 
synw (releasing, n) . 
synw (releasing, ving) . 
synw (removal , n) . 
synw ( remove , v) . 
synw ( remove , vp ) . 
synw (removed, ved) . 
synw (removed, ven) . 
synw (removes , vp) . 
synw (removing, n) . 
synw (removing, ving) . 
synw (replace, v) . 
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replace , vp) . 
replaced, ved) . 
replaced, ven) . 
replacement , n) . 
replaces , vp) . 
replacing,n) . 
replacing, ving) . 
repress, vp) . 
repress ,v) . 
repressed, ved) . 
repressed, ven) . 
represses, vp) . 
repressing, n) . 
repressing, ving) . 
repression, n) . 
require ,v) . 
require, vp) . 
required, ved) . 
required, ven) . 
requirement , n) . 
requires, vp) . 
requiring, n) . 
requiring, ving) . 
restrain, vp) . 
restrain, v) . 
restrained, ved) . 
restrained, ven) . 
restraining, ri) . 
restraining, ving) 
restrains, vp) . 
restraint , n) . 
sensitization, n) 
sensitize, vp) . 
sensitize, v) . 
sensitized, ved) . 
sensitized, ven) . 
sensitizes , vp) . 
sensitizing, n) . 
sensitizing, ving) 
separate, v) . 
separate, vp) . 
separated, ved) . 
separated, ven) . 
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(separates, vp) . 

(separating, n) . 

(separating, ving) . 

(separation, n) . 

(sever , v) . 

(sever , vp) . 

(severance, n) . 

(severed, ved) . 

(severed, ven) . 

(severing, n) . 

(severing, ving) . 

(severs, vp) . 

(signal , v) . 

(signal, vp) . 

(signaledy ved) . 

(signaled, ved j . 

(signaled, ven) . 

(signaling, n) . 

(signaling, ving) . 

(signals, vp) . 

(split , n) . 

(split , v) . 

(split , ved) . 

(split, ven) , 

(split, vp) . 

(splits, vp) . 
r (splitting, n) . 

(splitting, ving) . 

(stimulate, v) . 

(stimulate , vp) . 

(stimulated, ved) . 

(stimulated, ven) . 

(stimulates , vp) . 

(stimulating, n) . 

(stimulating, ving) . 

(stimulation, n) . 

(substitutes) . 

(substitute, vp) . 
r (substituted, ved) . 
' (substituted, ven) . 
r (substitutes , vp) . 

(substituting, n) . 

(substituting, ving) 
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synw (substitution, n) . 
synw (suppress , vp) . 
synw (suppress , v) . 
synw (suppressed, ved) . 
synw (suppressed, ven) . 
synw (suppresses , vp) . 
synw (suppressing, n) . 
synw (suppressing, ving) . 
synw (suppression, n ). 
synw (tie, n) . 
synw (tie ,v) . 
synw (tie, vp) . 
synw (tied, ved) . 
synw (tied, ven) . 
synw (ties , vp) . 
synw (transcribe, v) . 
synw(transcribe, vp) . 
synw (transcribed, ved) . 
synw (transcribed, ven) . 
synw (transcribes ,vp) . 
synw (transcribing, n) . 
synw (transcribing, ving). . 
synw (transcription, n) . 
synw (tying, n) . 
synw (tying, ving) . 
synw (ubiquitinization, n) . 
synw (ubiquitinize, v) . 
synw (ubiquitinize, vp) . 
synw (ubiquitinized, ved) . 
synw (ubiquitinized, ven) . 
synw (ubiquitinizes , vp) . 
synw (ubiquitinizing, n) . 
synw (ubiquitinizing, ving) . 
synw (urge , n) . 
synw ( urge, v) . 
synw (urge, vp) . 
synw (urged, ved) . 
synw (urged, ven) . 
synw (urges , vp) . 
synw (urging, n) . 
synw (urging, ving) . 

% the following are verbs connected with complexes 
synw (form, v) . 
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synw (f orm, vp) . 
synw (forms, vp) . 
synw (formed, ved) . 
synw (formed, ven) . 
synw (forming, n) . 
synw ( formation, n) . 
synw ( assemble, v) . 
synw (assemble , vp) . 
synw (assembles, vp) . 
synw (assembled, ved) . 
synw (assembled, ven) . 
synw (assembling, n) . 
synw (assembly , n) . 
synw (dissassemble, v) . 
synw (dissassemble, vp) . 
synw (dissassembles , vp) . 
synw (dissassembled, ved) . 
synw (dissassembled, ven) . 
synw (dissassembling, n) . 
synw (dissassembly, n) . 
synw (dissociate, v) . 
synw (dissociate, vp) . 
synw (dissociates, vp) . 
synw (dissociated, ved) . 
synw (dissociated, ven) . 
synw (dissociating, n) . 
synw (dissociation, n) . 
synw (recruit , v) . 
synw (recruit , vp) . 
synw (recruits , vp) . 
synw (recruited, ved) . 
synw (recruited, ven) . 
synw (recruiting, n) . 
synw (recruitment , n) . 
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% lexsemact . pat 

% revised March 17, 2000 

% SEMANTIC LEXICON OF ACTIONS 

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% 

o o o o o o o 

%%%%%%% 

% For genomics - the grammar tests for semantic and syntactic cate 
gories 

% separately for action type of categories; for substances the lex 
ical 

% entries are the same as in the medical area 

% action type phrases have two entries: a semantic entry and a syn 
tactic entry 

% This lexicon contains the semantic entries for words and phrases 

.% .semp is a lexical entry for phrasal lexicon 
% semp (+Wordl , + Sem, +Wordlist , +Targetf orm, +Features) 
% semp specifies a semantic lexical definition for the genomics li 
terature 

% semp is equivalent to the predicate "phrase" in the medical area 
% semp: Wordl is first word of phrase, Sem is semantic category 
% semp: Wordlist is list of words in phrase, Targetform is output 
form 

% semp: Features is a list of 2 elements or the atom "def M represe 
nting defaul 

% semp: Features 1st element is rev or nrev meaning reversed or no 
t reversed 

% semp: Features 2nd element is a # specifying number of arguments 
for action 

% semp: Features = def is equivalent to a list = [nrev, 2] 
% in case action has 1 argument, use [1,_] 

%semw is a lexical entry for single word 
% semw (+Word, +Sem, +Targetf orm, ^Features) 

% semw: the arguments are the same as for semp except there is no 
Wordlist 

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% 
%%%%%%%% 

:- multifile (semp/5) . 
:- multifile (semw/4 ) . 

semp (account . cause, [account , for] , cause, [def] ) . 
semp (accounted, cause, [accounted, for] , cause, [def]) . 
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semp (accounting, cause, [accounting, for] , cause, [def ] ) . 
semp (accounts , cause, [accounts , for] , cause, [def]) . 
semp(add, attach, [add, up], attach, [def]). 
semp (added, attach, [added, up], attach, [def]). 
semp(adds, attach, [adds, up], attach, [def]). 
semp (are, cause, [are, a, means, of , producing] , cause, [def] ) . 
semp (are, cause, [are, due, to] , cause, [2 , rev] ) . 
semp (as , cause, [as, a, result , of ] , cause, [2 rev] ) . 
semp (attributable, cause, [attributable, to] , cause, [2, rev]) . 
semp (attributed, cause, [attributed, to] , cause, [2, rev]) . 
semp (based, cause, [based, on] , cause, [2, rev] ) . 
semp (based, cause, [based, upon] , cause , [2, rev]) . 
semp (because, cause, [because, of ], cause, [2, rev]) . 
semp(convey, signal, [conveys, a, signal], signal, [def]). 
semp (conveyed, signal, [conveyed, a, signal], signal, [def]). 
semp (conveying, signal, [conveying, a, signal], signa-1 , [def]). 
J3emp (conveys , signal, [conveys, a, signal] , signal , [def]). 
semp (dissociate , release, [dissociate," from] , release, [def] ) . 
semp (dissociated, release, [dissociated, from] , release, [def]) . 
semp (dissociates, release, [dissociates, from], release, [def ]) . 
semp (dissociation, release, [dissociation, from], release, [def] ) . 
semp (down, signal , [down, , regulate] , signal, [def] ) . % A down- 
regulates B A --> B 
semp (down, signal , [down, ' - ' , regulated] , 
-regulates B A --> B 
semp (down, signal , [down, ' - ' , regulates] , 
-regulates B A --> B 
semp (down, signal , [down, ' - ' , regulation] 
n-regulates B A --> B 

semp (due, cause, [due, to, the, fact , that] , cause, [2 , rev] ) . 
semp (due , cause , [due , to] , cause , [2 , rev] ) . 
semp (form, attach, [form, complex], attach, [def]). 
semp (formation, attach, [formation, of, complex], attach, 
semp (formed, attach, [formed, complex], attach, [def]). 
semp(forms, attach, [forms, complex], attach, [def]). 
semp (had, cause, [had, an, active, role, in] , cause, [def]) . 
semp (has , cause , [has , an, active , role , in] , cause , [def] ) . 
semp (have, cause, [have, an, active, role, in] , cause, [def]) . 
semp (is, cause, [is, a, means, of , producing] , cause , [def]). 
semp (is , cause, [is, due , to] , cause, [2 , rev] ) . 

semp (functions, inactivate , [functions , as, a, negative, regulator , of ] , i 
nactivate, [def] ) . 

semp (function, inactivate, [function, as, a, negative, regulator , of ] , ina 



signal , [def] ) . 
signal , [def] ) . 
signal , [def] ) 



% A down 



% A down 



A dow 



[def]) 
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ctivate, [def ] ) . 

sempdead, cause, [lead, to] , cause, [def] ) . 
semp (lead, causel, [lead, to] , cause, [def]). 
semp (leading, cause, [leading, to] , cause, [def] ) . 
semp (leading, cause, [leading, to] , cause, [def]) . 
semp (leads , cause, [leads, to], cause, [def ]) . 
semp (leads, causel, [leads, to] , cause, [def] ) . 
semp (led, cause, [led, to] , cause, [def] ) . 

semp (may, cause, [may , be , responsible , for] , cause, [def]) . 
semp (mediate, signal, [mediate, a, signal], signal, [def]) 
mediates a signal to B 

[mediated, a 
B 

[mediates, a 
B 

[mediation, of , 



%A 



semp (mediated, signal , 
A mediates a signal to 
semp (mediates , signal , 
A mediates a signal to 
semp (mediation, signal , 



signal] , signal, [def] ) . 
signal] , signal, [def] ) . 
a, signal], signal, [def]) 



%A me dia tes a jsignal to B 



semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, 


createbond, 


[n, 


semp (n, breakbond, [n, 


i _ i 


sis' , [def] ) . 




semp (o, 


createbond, 


[o, 


semp (o, 


createbond, 


[o, 


semp (o, 


createbond, 


[o, 


semp (o, 


createbond, 


[o, 



,acetylate] , »N-acetylate *", [def J ) T 
,acetylated] , ' N-acetylate ' , [def] ) . 
,acetylates] , 'N-acetylate' , [def] ) . 
, acetylation] , 'N-acetylate* , [def] ) . 
, acylate] , ' N-acylate 1 , [def] ) . 
,acylated] , 'N-acylate' , [def] ) . 
,acylates] , 'N-acylate' , [def] ) . 
,acylation] , 'N-acylate' , [def] ) . 
glycosylate] , ' N-glycosylate ' , [def] ) . 
glycosylated] , 'N-glycosylate' , [def] ) . 
glycosylates] , 'N-glycosylate' , [def] ) . 
, glycosylation] , 'N-glycosylate' , [def] ) . 
-' , terminal proteolysis] , »n-terminal proteol 



' O-glycosylate ' , [def] ) . 
' O-glycosylate ' , [def] ) . 
'O-glycosylate' , [def] ) . 
, 'O-glycosylate' , [def] ) 
[2, rev] ) . 



- ' , glycosylate] , 
- ' , glycosylated] , 
- ' glycosylates] , 
- ' , glycosylation] 
semp (only, time, [only, after] , 'only after' , 
semp (prolyl , createbond, [prolyl , ■ - ' , 4 , ' - ' , hydroxylate] , 

' prolyl -4 -hydroxylate ' , [def] ) . 
semp (prolyl , createbond, [prolyl , ' - ' , 4 , ' - ' , hydroxylated] , 

' prolyl -4 -hydroxylate ' , [def] ) . 
semp (prolyl , createbond, [prolyl , ' - ' , 4 , ' - ' , hydroxylates] , 

' prolyl -4 -hydroxylate ' , [def] ) . 
semp (prolyl , createbond, [prolyl , ' - ' , 4 , ' - ' , hydroxylation] , 
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'prolyl -4 -hydroxylate ' , [def] ) . 
semp (result, cause, [result, from] , cause, [2 , rev] ) . 
semp (result, cause, [result, in] , cause, [def] ) . 
semp (resulted, cause, [resulted, from] , cause, [2, rev]) . 
semp (resulted, cause, [resulted, in] , cause, [def]) . 
semp (resulting, cause, [resulting, from] , cause , [2, rev]) . 
semp (resulting, cause , [resulting, in] , cause, [def] ) . 
semp (results, cause, [results, from] , cause, [2,rev]). 
semp (results, cause, [results, in] , cause, [def]). 
semp(set, release, [set, free], release , [def ] ) . 
semp(set, release, [set, free], release , [def ] ) . 
semp(sets, release, [sets, free], release , [def ] ) . 
semp (setting, release, [setting, free], release , [def ] ) . 
semp (suppress, inactivate, [suppress, activity, of], inactivate, [ 

semp (suppressed, inactivate, [suppressed, activity, of], inactivat 
e, [def] ) . = ^ _ . ^ __ . _ 

semp (suppresses, inactivate, [suppresses, activity, of], inactivat 
e, [def]). 

semp (suppression, inactivate, [suppression, of , activity, of], inac 
tivate, [def] ) . 

semp(switch, activate, [switch, on, the, activity, of], activate 
, [def] ) . 

semp (switched, activate, [switched, on, the, activity, of], acti 
vate, [def] ) . 

semp (switches, activate, [switches, on, the, activity, of], acti 
vate, [def] ) . 

semp (up, signal , [up, regulate] , signal, [2, rev]) . % A up-regul 
ates B B --> A 

semp (up, signal, [up, ' - ' , regulated] , signal, [2, rev] ) . 
semp (up, signal, [up, ' - ' , regulates] , signal, [2, rev] ) . 
semp (up, signal, [up, ' - ' , regulation] , signal, [2, rev] ) . 
semp (was, cause, [was , a, means , of , producing] , cause, [def]) . 
semp (was , cause , [was , due , to] , cause , [2 , rev] ) . 

semp (were, cause, [were , a , means , of , producing] , cause, [def] ) . 

semp (were , cause , [were , due , to] , cause , [2 , rev] ) . 

semw (acetylate, createbond, acetylate, [def] ) . 

semw (acetylated, createbond, acetylate, [def]) . 

semw (acetylates , createbond, acetylate, [def]) . 

semw (acetylation, createbond, acetylate, [def]) . 

semw (activate, activate, activate, [def] ) . 

semw (activated, activate, activate, [def]) . 

semw (activates, activate, activate, [def] ) . 
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semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




s emw 




semw 




-semw 




semw 


VI 


semw 


use 






semw 


% er 




rr s 


semw 


: s 
e ir 


semw 


V K 


semw 


H 


semw 






s s 


semw 




semw 


1 L 

F st 


semw 


as; 






semw 




semw 


£3 






semw 




semw 




semw 




semw 




bond 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 



activation, activate, activate, [def ] ) . 
add, attach, attach, [def] ) . 
added, attach, attach, [def] ) . 
addition, attach, attach, [def] ) . 
adds, attach, attach, [def]) . 

after, time, after, [2 , rev] ) . % temporal relations 
aggregate , attach, attach, [def]) . 
aggregated , attach, attach, [def] ) . 
aggregates, attach, attach, [def] ) . 
aggregation , attach, attach, [def] ) . 
arrest, inactivate, inactivate, [def]) . 
arrested, inactivate, inactivate, [def] ) . 
arrests, inactivate, inactivate, [def]) . 
associate, attach, attach, [def] ) . 
associated, attach, attach, [def]) . 
associates, attach, attach, [def ] ) . 
association, attach, attach, [def] ) . 
attach, attach, attach , [def] ) . 
attached , attach, attach, [def] ) . 
attaches, attach, attach, [def] ) . 
attachment, attach, attach, [def]) . 
bind, attach, attach, [def] ) . 
binding, attach, attach, [def] ) . 
binds , attach, attach, [def]) . 
block, inactivate, inactivate, [def]) . 
blocked, inactivate , inactivate, [def]) . 
blocking, inactivate , inactivate, [def]) . 
blocks, inactivate, inactivate, [def]) . 
bound, attach, attach, [def] ) . 
break, breakbond, 'break bond', [def]) . 
breakage, breakbond, 'break bond' , [def] ) . 
breaks, breakbond, 'break bond' , [def] ) . 
broke, breakbond, 'break bond' , [def] ) . 
broken, breakbond, 'break bond', [def]) . 



case without break 



catalyzation, promote , catalyze, [def] ) 
catalyze, promote, catalyze, [def]) . 
catalyzed, promote, catalyze, [def]) . 
catalyzes, promote, catalyze, [def] ) . 
catalyzing, promote, catalyze, [def] ) . 
cause, cause, cause, [def] ) . 
caused, cause, cause, [def] ) . 
causes, cause, cause, [def] ) . 
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semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 






" "til 


semw 


v. 3 £ 


semw 




semw 


IS; 


semw 




semw 


f LI 


semw 




semw 


s 


semw 


o 


semw 


zxzv. 


semw 


r 


semw 


f *l 


semw 


s r 


semw 




semw 




semw 




semw 




semw 




semw 




semw 




y? 




semw 




semw 




semw 




semw 




semw 




semw 



cleavage, breakbond, "break bond 1 , [def ] ) . 
cleave, breakbond, "break bond' , [def] ) . 
cleaved, breakbond, 'break bond' , [def] ) . 
cleaves, breakbond, 'break bond' , [def] ) . 
coimmunoprecipitate, attach, attach, [def]) . 
coimmunoprecipitated , attach, attach, [def]) . 
coimmunoprecipitates , attach, attach, [def]) . 
coimmunoprecipitation , attach, attach, [def]) . 
combination , attach, attach, [def] ) . 
combine , attach, attach, [def] ) . 
combined , attach, attach, [def] ) . 
combines, attach, attach, [def] ) . 
conjugate , attach, attach, [def] ) . 
conjugated , attach, attach, [def] ) . 
conjugates, attach, attach, [def] ) . 
conjugation , attach, attach, [def]') . 
connect , attach, attach, [def] ) . 
connected , attach; attach, [def ] ) . 
connection , attach, attach, [def] ) . 
connects, attach, attach, [def] ) . 
constrain, inactivate, inactivate, [def]) . 
constrained, inactivate, inactivate, [def]) . 
constrains, inactivate, inactivate, [def]) . 
constraint, inactivate, inactivate, [def] ) . 
coprecipitate, attach, attach, [def] ) . 
coprecipitated, attach, attach, [def] ) . 
coprecipitates, attach, attach, [def]) . 
coprecipitation , attach, attach, [def]) . 
copurif ication , attach, attach, [def]) . 
copurified , attach, attach, [def] ) . 
copurif ies, attach, attach, [def] ) . 
copurif y , attach, attach, [def]) . 
couple , attach, attach, [def]) . 
coupled, attach, attach, [def]) . 
couples, attach, attach, [def]) . 

cut, breakbond, 'break bond', [def]) . % leave breakbond onl 

cuts, breakbond, 'break bond' , [def] ) . 
deactivate, inactivate, inactivate, [def] ) . 
deactivated, inactivate, inactivate, [def] ) . 
deactivates, inactivate, inactivate, [def]) . 
deactivation, inactivate, inactivate, [def] ) . 
death, process, death, [1] ) . 
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rii 



semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
gument 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 



demethylate, breakbond, demethylate, [def ] ) . 
demethylated, breakbond, demethylate, [def]) . 
demethylates, breakbond, demethylate, [def]) . 
demethylation, breakbond, demethylate, [def] ) . 
dephosphorylate, breakbond, dephosphorylate, [def]) . 
dephosphorylated, breakbond, dephosphorylate , [def] ) . 
dephosphorylates, breakbond, dephosphorylate , [def] ) . 
dephosphorylation, breakbond, dephosphorylate , [def]) . 
die, process, death, [1] ) . 
died, process, death, [1] ) . 
dies, process, death, [1] ) . 
disassemble, release, release, [def]) . 
disassembled, release, release, [def]) . 
disassembles, release, release, [def]) . 
disassembly, release, release, [def]) . 
discharge, release, release, [def] ) . 
discharged, release, release, [def]) . 
discharges", release, release, [def] ) . 
disengage, release, release, [def] ) . 
disengaged, release, release, [def] ) . 
disengagement, release, release, [def]) . 
disengages, release, release, [def]) . 
divide, breakbond, 'break bond', [def]) . 
divided, breakbond, 'break bond' , [def] ) . 
divides, breakbond, 'break bond' , [def] ) . 
division, breakbond, 'break bond' , [def] ) . 
dying, process, death, [1] ) . 
enhance, promote, promote, [def] ) . 
enhanced, promote , promote , [def] ) . 
enhancement , promote, promote, [def] ) . 
enhances, promote, promote, [def]) . 
enhancing, promote, promote, [def]) . 

express, generate , express , [def]) . % can have either 1 or 2 ar 
s 

expressed, generate, express , [def] ) . 
expresses, generate , express , [def] ) . 
expressing, generate , express , [def] ) . 
expression, generate, express, [def] ) . 
generate, generate, generate, [def]) . 
generated, generate, generate, [def] ) . 
generates, generate, generate, [def] ) . 
generating, generate, generate, [def]) . 
generation, generate, generate, [def] ) . 
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lexsemact . pat . txt 



semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
-.semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 



hew, breakbond, 'break bond' , [def] ) . 
hewed, breakbond, 'break bond' , [def] ) . 
hews, breakbond, 'break bond' , [def] ) . 
hinder, inactivate, inactivate, [def] ) . 
hindered, inactivate, inactivate, [def]) . 
hinders, inactivate, inactivate, [def]) . 
hindrance, inactivate, inactivate, [def]) . 
inactivate, inactivate, inactivate, [def] ) . 
inactivated, inactivate, inactivate, [def]) . 
inactivates, inactivate, inactivate, [def] ) . 
inactivation, inactivate, inactivate, [def]) 
incite, activate, activate, [def]) . 
incited, activate, activate, [def] ) . 
incitement, activate, activate, [def]). 
incites, activate, activate, [def]) . 
induce, activate, activate, [def] ) . 
induced, activate, activate, [def]) . 
induces-, activate, activate, [def]) . 
induction, activate, activate, [def]) . 
influence, activate, activate, [def]) . 
influenced, activate, activate, [def] ) . 
influences, activate, activate, [def]) . 
influencing, activate, activate, [def]) . 
inhibit, inactivate, inactivate, [def] ) . 
inhibited, inactivate, inactivate, [def]) . 
inhibition, inactivate, inactivate, [def] ) . 
inhibits, inactivate, inactivate, [def]) . 
initiate, activate, activate, [def] ) . 
initiated, activate, activate, [def]) . 
initiates, activate, activate, [def]) . 
initiattion, activate, activate, [def] ) . 
instigate, activate, activate, [def]) . 
instigated, activate, activate, [def]) . 
instigates, activate, activate, [def]) . 
instigation, activate, activate, [def]) . 
interact, interact, interact, [def] ) . 
interacted, interact, interact, [def]) . 
interaction, interact, interact, [def]) . 
interactions, interact, interact, [def]) . 
interacts, react, interact, [def]) . 
join , attach, attach, [def]) . 
joined , attach, attach, [def] ) . 
joining, attach, attach, [def]) . 
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lexsemact . pat . txt 





semw 


(joins, attach, attach, [def ] ) . 




semw 


(juncture, attach, attach, [def]) . 




semw 


(liberate, release, release, [def] ) . 




semw 


(liberated, release, release, [def]) . 




semw 


(liberates, release, release, [def]) . 




semw 


(liberation, release, release, [def]). 




semw 


(limit, inactivate, inactivate, [def]) . 




semw 


(limitation, inactivate, inactivate, [def]) . 




semw 


(limited, inactivate, inactivate, [def] ) . 




semw 


(limits, inactivate, inactivate, [def] ) . 




semw 


(link, attach, attach, [def]) . 




semw 


(linked, attach, attach, [def]) . 




semw 


(linking, attach, attach, [def]) . 




semw 


(links , attach, attach, [def] ) . 




semw 


(mediate, promote, promote, [def] ) . 




semw 


(medxa-ted, promote, promote, [def] ) . 




semw 


(mediates, promote, promote, [def] ) . 




.. . semw 


(mediation, promote, promote, [def ] ) . 


i. c 


semw 


(methylate, createbond, methylate, [def]) . 


5 r = 


semw 


(methylated, createbond, methylate, [def] ) . 


. =3 


semw 


(methylates, createbond, methylate, [def] ) . 


til 


semw 


(methylation, createbond, methylate, [def] ) . 


K ■ $ 

3 


semw 


(modification, modify, modify, [def]) . 


V 2 


semw 


(modified, modify, modify, [def]) . 


« 


semw 


imodif ies , modify , modify , [def] ) . 




semw 


(modify, modify , modify, [def] ) . 


a sa 


semw 


(modifying, modify , modify, [def] ) . 


; : 

f zst 


semw 


(mutate, modify, mutate, [1] ) . 




semw 


(mutated, modify , mutate, [1]) . 




semw 


(mutates , modify , mutate , [1]) . 




semw 


(mutating, modify , mutate , [1] ) . 




semw 


(mutation, modify , mutate , [1] ) . 




semw 


(overexpressed, generate , overexpress , [def]) . 




semw 


(overexpresses, generate , overexpress , [def] ) . 




semw 


(overexpressing, generate , overexpress , [def] ) . 




semw 


(overexpress, generate, express, [def]) . 




semw 


(overexpression, generate, overexpress, [def]) . 




semw 


(pair , attach, attach, [def]) . 




semw 


(paired, attach, attach, [def] ) . 




semw 


(pairing, attach, attach, [def]) . 




semw 


(pairs, attach, attach, [def] ) . 




semw 


(phosphorylate, createbond, phosphorylate , [def]) . 




semw 


(phosphorylated, createbond, phosphorylate, [def]) . 
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lexsemact . pat . txt 



semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
A i 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 
semw 



phosphorylates, createbond, phosphorylate , [def ] ) . 
phosphorylation, createbond, phosphorylate, [def] ) 
precede, cause, cause, [def] ) . 
preceded, cause, cause, [def]). 
precedes, cause, cause, [def]). 
preceding, cause, cause, [def] ) . 
promote, promote, promote, [def]) . 
promoted, promote, promote, [def]) . 
promotes, promote, promote, [def] ) . 
promotion, promote, promote, [def] ) . 
prompt, activate, activate, [def]) . 
prompted, activate, activate, [def] ) . 
prompting, activate, activate, [def]) . 
prompts, activate, activate, [def]) . 
react, react, react, [def]) . 
reacted, react , react , [def] ) . 
reaction, react, react, [def] ) . 
reactions, react, react, [def] ) . 
reacts, react, react, [def] ) . 
regulate, signal, signal, [def]) . 
regulated, signal, signal, [def]) . 
. --> B 

regulates, signal, signal, [def]) . 
regulation, signal, signal, [def]) . 
release, release, release, [def] ) . 
released, release, release, [def]) . 
releases, release, release, [def]) . 
removal, breakbond, 'break bond ' , [def] ) . 
remove, breakbond, 'break bond ' , [def] ) . 
remove, breakbond, 'break bond ' , [def] ) . 
removes, breakbond, 'break bond ' , [def] ) . 
replace, substitute, substitute, [def]) . 
replaced, substitute, substitute, [def]) . 
replacement, substitute, substitute, [def]) 
replaces, substitute, substitute, [def] ) . 
repress, inactivate, inactivate, [def]) . 
repressed, inactivate, inactivate, [def]) . 
represses, inactivate, inactivate, [def]) . 
repression, inactivate, inactivate, [def] ) . 
require, cause, cause, [2, rev] ) . 
required, cause, cause, [2, rev] ) . 
requirement, cause, cause, [2, rev]) . 
requires, cause, cause , [2 , rev] ). 



% B is regulated by 
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lexsemact . pat . txt 





semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 


JIL . 


s ejnw^ 




semw 


Id 


semw 


ass 


semw 








semw 


m 


semw 




semw 




semw 


O 


semw 




semw 


r "~ 


semw 


n zz 






semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 




semw 



requiring, cause, cause, [2, rev] ). 
restrain, inactivate, inactivate, [def] ) . 
restrained, inactivate, inactivate, [def]) . 
restrains, inactivate, inactivate, [def]) . 
restraint, inactivate, inactivate, [def]) . 
sensitization, activate, activate, [def]) . 
sensitize, activate, activate, [def] ) . 
sensitized, activate, activate, [def] ) . 
sensitizes, activate, activate, [def] ) . 
separate, breakbond, 'break bond' , [def] ) . 
separated, breakbond, 'break bond', [def]) . 
separates, breakbond, 'break bond', [def]) . 
separation, breakbond, 'break bond', [def]) . 
sever, breakbond, 'break bond' , [def] ) . 
severance, breakbond, 'break bond', [def]) . 
severed, breakbond, 'break bond ', [def ]) . 
severs, breakbond, 'break bond' , [def] ) . 
signal, signal, signal, [def] ) . 
signaled, signal, signal, [def]) . 
signaling, signal, signal, [def] ) . 
signals, signal, signal, [def]) . 
split, breakbond, 'break bond' , [def] ) . 
splits, breakbond, 'break bond' , [def] ) . 
splitting, breakbond, 'break bond' , [def] ) . 
stimulate, activate, activate, [def]) . 
stimulated, activate, activate, [def] ) . 
stimulates, activate, activate, [def] ) . 
stimulation, activate, activate, [def] ) . 
substitute, substitute, substitute, [def]) . 
substituted, substitute, substitute, [def]) . 
substitutes, substitute, substitute, [def]) . 
substitution, substitute, substitute, [def]) 
suppress, inactivate, inactivate, [def]) . 
suppressed, inactivate, inactivate, [def]) . 
suppresses, inactivate, inactivate, [def]) . 
suppression, inactivate, inactivate, [def] ) . 
tie, attach, attach, [def] ) . 
tied, attach, attach, [def] ) . 
ties, attach, attach, [def] ) . 
transcribe, generate, transcribe, [def]) . 
transcribed, generate, transcribe, [def] ) . 
transcribes, generate, transcribe, [def] ) . 
transcribing, generate, transcribe, [def] ) . 
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lexsemact . pat . txt 



transcription, generate, transcribe, [def] ) . 

ubiquitinize, createbond, ubiquitinize , [def]). 

ubiquitinize, createbond, ubiquitinize, [def]) . 

ubiquitinized, createbond, ubiquitinize, [def]) 

ubiquitinizes, createbond, ubiquitinize, [def] ) 

urge, activate, activate, [def ]) . 

urge, activate, activate, [def] ) . 

urged, activate, activate, [def]) . 

urges, activate, activate, [def]) . 

urging, activate, activate, [def]) . 

form, attach, attach, [def] ) . 

forms, attach, attach, [def] ) . 

formed, attach, attach, [def] ) . 

forming, attach, attach, [def] ) . 

formation, attach, attach, [def] ) . 

assemble, attach, attach, [def] ) . 

assembles, attach, attach, [def]) . 

assembled, attach, attach, [def]) . 

assembling, attach, attach, [def] ) . 

assembly , attach, attach, [def]) . 

dissassemble, release, release, [def] ) . 

dissassembles, release, release, [def] ) . 

dissassembled, release, release, [def] ) . 

dissassembling, release, release, [def] ) . 

dissassembly, release, release, [def] ) . 

dissociate, release, release, [def] ) . 

dissociates, release, release, [def] ) . 

dissociated, release, release, [def] ) . 

dissociating, release, release, [def] ) . 

dissociation, release, release, [def] ) . 

recruit , attach, attach, [def]) . 

recruits , attach, attach, [def] ) . 

recruited, attach, attach, [def] ) . 

recruiting, attach, attach, [def] ) . 

recruitment , attach, attach, [def]) . 
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% edited Genome grammar - adapted from MedLEE' s grammar for use with MedLEE 

% this is to be used along with the genomics lexicon of substances, actions, 

% and relations . 

% revised March 16, April 5, 2000 

% adjusted for tagged input 

:- multif ile (wdef /3) . 

:- multif ile (phrase/5) . 

%%%%%%%%%%%%%%%%%%%% Semantic Grammar for Genomics %%%%%%%%%%%%%%%%%%%%%%%%%%%% 

% * 

% Written by Carol Friedman for the MedLEE System % 

% 

% Queens College of the City University of New York % 

% * 
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%^%^ %%%%%%%%%%%%% 

% Highest Level Predicate - sem_sent - 1st arg. is target structure % 
% - 2nd arg. is a list of words in sentence% 

% - 3rd arg. is ' [] ' % 

% Target structure: a frame or set of connected frames: % 

% the frame describes an action or several related actions; % 

% an action frame is a list consisting of the symbol 'action 1 '*^ % 

% followed by the code for the action and arguments. % 

% . The arguments are either, substances or actions; = _ - - . % 

O % each substance slot consists of the name of the type of % 

% substance followed by the value for the substance; % 

{j| % the substance slot may contain slots for several substances. % 

a ll % Examples: % 

k *% % Blocking of il-2 gene transcription by activated rapl . % 

f}l % [action, inactivate, [protein, Rapl , [state, active] ] , % 

*)t % [action, transcribe, [x] , [gene, interleukin-2] ] ] % 

ry % % 

% The adapter protein crkl was associated with both phosphorylated cbl and the% 
- % guanidine nucleotide-releasing factor c3g. % 

[3 % [action, attach, [protein, CrkL] , % 
e ~ % [relation, and, [protein, Cbl, [state, phosphorylated] ] , % 

L-j. % [protein, guanidine nucleotide-releasing factor C3G, 

% [state , phosphorylated] ] ] ] % 

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%^% %%%%%%%%%%%%% 
% fail an unknown predicate 
unknown (_, fail) . 

op(900, fy, [not,once]). % same priority and type as \+ 
op(700, xfx, [\=,~=]). % same priority and type as = or == 

% snoop is generally used to find input string when using a DCG 
% the input string is used for constraints 

snoop (A, B, A, B) . 



sem_sent (P,$emlist , X) --> 

{assert (addstotal (0) ) } , 
sem_parse (P, Semlist , X) . 

sem_parse (Target , Semlist) --> 

semjpatterns (P, Semlist) . 

sem_j?arse (Target, Semlist, X) --> 
sem_patterns (P, Semlist) , 
sem_endornot (P, Target, X) . 



sem_j?arse ( [failure] X,_,_) :- 
addstotal (X) . 

sem_endornot (P, P,X) --> % P is target if there is an endmark 



sem_endmark, 

{addstotal (X) } . % X is number of times reached endmark 
sem_endornot (_,_,_,_,_) :- % did not reach endmark; update count and fail 

uptotal, fail. 
sem_endornot(_, [failure] ,X,_,_) :- 

addstotal (X) , % X is number of times reached 

X >= 50. 



% Finding patterns 

sem_patterns (F, Semlist) --> 
pattern(Fl / Semlist) , 

{Fl \= []}, % 1st finding should not be empty 

morepattern (R,F2, Semlist) , % connected patterns 
{getrelation(R,Fl,F2,F) } . 

y'i-i'A A i i kk kkrkk k k kk kr -k kr kr k-kkkkkkkkkkkkkkkkkkk k k iixxx Air k k -k k kk k k * 

* The action pattern types are: pattern, nounactionpatt , actpatt, and * 
* . nounactpatt . ______ . _ . ^ * 

* pattern --> actionarg (Al) * 

* active or passive verb * 

* actionarg (A2) . * 

* pattern --> nounactionpatt. * 

* pattern --> actpatt . * 

% pattern is saved in a symbol table (st) ; check for success/failure 1st 
% Case where pattern is in st and has been successful 
pattern (Fmt,_) --> checkst (pattern, _, s , Fmt) . 
% Case where pattern is in st as a failure, 
pattern (_,_) --> checkst (pattern. f ,_) , {!, fail}. 

% pattern 5 : an action pattern with a nominal verb 
% Psl cleavage by zvad. 

% apoptosis- induced cleavage of PS2 by zDEVD. 
pattern (F, Semlist) --> 
snoop (SO, SO) , 
{ \+ checkst (pattern, 5, SO, _) , 
actionchk (Semlist) } , 
nounactionpatt (F) , 
snoop ( S , S ) , 
{ addst (pattern, 5, s, F, SO, S) 

}• 

% pattern 1: an action/substance acts on an action/substance 

% the activation of rapl inhibits the expression of il-2 

% rapl functions as a negative regulator of tcr-mediated il-2 gene 

% transcription. 

pattern (F, Semlist) --> snoop (SO, SO) , % SO is the input string 
{ \+ checkst (pattern, 1,_,_, SO, _) , 
actionchk (Semlist) , 
connectchk (Semlist ) }, 
actionarg (Al) , 



3 



connectact (Sem, [v / vp,ved] , Target , Features) , 
actionarg (A2) , 

snoop(S,S), %ending sentence list 
{ member<def, Features), 

modlist ( [Al,A2,Site] ,Mods) ; 
member (rev, Features) , 
modlist ( [A2,Al,Site] ,Mods) ) , 
frame (F, action, Target, Mods) , 
addst (pattern, 1, s, F, SO, S) 

}. 

% pattern 2: an action/substance was acted on by an action/substance 
% The aggregation of bad was suppressed. 

% The aggregation of bad was suppressed by the phosphorylation of jnk. 
% Grb2 was associated with Cbl . 

% Apoptosis -associated cleavage of endogenous PS1 was blocked by the 
% treatment with zVAD. 
pattern (F, Semlist) - - > 

snoop (SO, SO) , % SO is the input string 

{ \t check st (pattern, 2 , , _ , 3 0 , _) , 

actionchk (Semlist) , 
connectchk (Semlist) } , 
actionarg (A2) , 
sem_beterm (_) , % was 

connectact (Sem, [ven] , Target , Features) , %activated 
optbyarg (Al) , 

snoop(S,S), %ending sentence list 
{ (member (def, Features), 

modlist ( [Al,A2,Site] ,Mods) ; 
member (rev, Features) , 
modlist ( [A2,Al,Site] ,Mods) ) , 
frame (F, action, Target, Mods) , 
addst (pattern, 2, s, F, SO, S) 

}• 

% pattern 3 : an action/substance acted on an action/substance 

% bad induced phosphorylation of fyn. 

% tcr and cd28-mediated il-2 transcription. 

pattern (F, Semlist) - -> 

snoop (SO, SO) , 
{ \+ checkst (pattern, 3,_,_,S0,_), 

actionchk (Semlist) , 

connectchk (Semlist) } , 

actionarg (Al) , % substance or basic action 
% optdash, 

connectacts (Sem, [vp,ven,ved] , Target , Features) , % Activated' 
% optof, 

actionarg (A2) , % had pattern here 
snoop (S, S) , 
{ (member (def, Features), 

modlist ( [Al,A2,Site] ,Mods) ; 
member (rev, Features) , 
modlist ( [A2,Al,Site] ,Mods) ) , 
frame (F, action, Target, Mods) , 
addst (pattern, 3, s, F, SO, S) 

}• 



% pattern 4: a simple action pattern with an active verb. 
% Activated Raf-1 phosphorylates MEK-1. 
pattern (F, Semlist) --> 
snoop (SO, SO) , 

%check that sentence has an action word/phrase 
{ \+ checkst (pattern, 4,_,_,S0,_), 

actionchk (Semlist) } , 

actpatt (F) , 

snoop (S, S) , 
{ addst (pattern, 4,s,F,S0,S) 

}• 

% no more patterns - save failure 

pattern (_,_) --> addst (pattern, 0, f,_) , {!, fail}. 

% sem_morepattern(-Rel, -P, +Semlist, +S0, +S) : 
% Rel is a relation and its value frame; 

% P is the remaining patterns, Semlist is the list of semantic classes 

% in sentence 

% if have a series of ','s, use the relation "and" or "or" if in the nest 

% and make that the^ relation 

morepattern (R, F, Semlist) --> 

sem_relation(Rl,Modl) , %relation and modifiers 

sem_pat terns (F, Semlist) , 

{( frame (F, rel , Conj2 , _) , % F contains nested relation 

(Conj2 = and; Conj2 = or), f rame (Rl, rel ,',',_) , % Rl relation frame 
frame (R, rel, Con j 2, _) % value of relation is Conj2 

Rl \= [] , % where do Type, Value and Mods2 come from? 
frame (Rl, Type, Value ,Mod2) , % get components of original relation 
mergemods (Modi , Mod2 , Mods ) , 
( Mods = [] , f rame (R, rel, Value, []) , !; 

%frame(R,rel, [Value | Mods] , [] ) % make it rel connector with rel mod 

R = [rel, [Value | Mods] ] 

) 

) 

}. 

% no more findings 
morepattern ( [],[],_, S , S) . 

% actionarg is the argument of pattern 

% actionarg is either a substance or a basic action 

% actionarg is saved in a symbol table (st) ; check for success/failure 1st 
% Case where actionarg is in st and have been successful 
actionarg(A) --> checkst (actionarg, _, s, A) . 
% Case where actionarg is in st as a failure, 
actionarg (_) --> checkst (actionarg, _, f,_) , {!, fail}. 

% actionarg 1 : a substance or substances 
% Rapl, active Rapl, Cbl and Crkl 

actionarg(A) --> snoop (SO , SO) , % SO is the input string 
{ \+ checkst (actionarg, 1,_,_, SO, _)} , 

substances (A) , 

snoop (S, S) , 
{ addst (actionarg, 1, s, A, SO, S) }. 



% actionarg 2: a process like apoptosis, or a disease 
actionarg(A) snoop (SO , SO) , % SO is the input string 

{ \+ checkst (actionarg, 2 SO, _) } , 
processpatt (A) , 
snoop (S, S) , 
{ addst (actionarg, 2 , s , A, SO , S) 

}• 

% actionarg 3 : a nominal action pattern 
% Etoposide- induced apoptosis. 
% Etoposide- induced PS1 cleavage by zVAD. 
actionarg(A) --> snoop (SO , SO) , % SO is the input string 
{ \+ checkst (actionarg, 3, SO, _) } , 

nounactionpatt (A) , 

snoop (S , S) , 

{addst (actionarg, 3, s, A, SO, S) 

}• 

% act i-ona-rg 4 : the object of the nominal action is ari actionaTg 
% Blocking of IL-2 Gene transcription by activated rapl . 
actionarg(A) --> snoop (SO , SO) , % SO is_ the input string 
{ \+ checkst (actionarg, 4 , SO , _) }, 
action (Sem, [n,ving] , Target , Features) , 
[of] , 

actionarg (Al) , 
optbyagent ( A2 ) , 
snoop ( S , S ) , 
{ (member (def, Features), 
modlist ( [Al, A2] ,Mods) ; 
member (rev, Features) , 
modlist ( [A2,A1] ,Mods) ) , 
frame (A, action, Target, Mods) , 
addst (actionarg, 4, s, A, SO, S) 

}■ 



% no more actionarg - save failure 

actionarg (_) --> addst (actionarg, 0 , f ,_) , {!, fail}. 

% nounactionpatt is a nominal action pattern which allows for left and right 
% modifiers 

% 11-2 gene transcription mediated by tcr and cd28 was inhibited by rapl. 

% Activated rapl functions as a negative regulator of tcr and cd- 2 8 -mediated 

il_2 transcription. 

% nounactionpatt is saved in a symbol table (st) ; check for success/failure 1st 
% Case where nounactionpatt is in st and has been successful 
nounactionpatt (A) --> checkst (nounactionpatt s, A) . 
% Case where nounaction patt is in st as a failure, 
nounactionpatt (_) --> checkst (nounactionpatt ,_, f,_) , {!, fail}. 

nounactionpatt (P) --> snoop (SO, SO) , % SO is the input string 

{ \+ checkst (nounactionpatt, 1 ,_,_/S0,_)}, 
actionlmod(L, Synl) , 
nounactionunit (A) , 
actionrmod(R, Syn2) , 




snoop (S, S) , 
{ (Synl = ved, append (R, [A] , RA) , 
append (L, RA, P) ; 
Synl = ving, append (R, [A] , RA) , 
L = [action, Verb, Object] , 
modlist(RA, Object, Mods), 
frame (P, action, Verb, Mods)), 
addst (nounactionpatt, 1, s, P, SO, S) } . 
% no more nounactionpatt - save failure 

nounactionpatt (_) --> addst (nounactionpatt , 0 , f ,_) , {!, fail}. 

% the central unit of the nounactionpatt is a nounactpatt or a process 
nounactionunit (A) --> nounactpatt (A) . 
nounactionunit (A) --> process (A) . 



% left modifiers of nounactpatt 
% Zvad- inhibited cleavage pf Psl 
actionlmod(L, ved) --> substances (S) , 

optdash, 

a c t i on { S em , [ ve d ] , Target , F e atu-r e s ) , 
{ frame(L, action, Target, [S] ) }. 

= % apoptosis^ induced cleavage "of ps2 
actionlmod(L, ved) --> process(S), 

optdash, 

action (Sem, [ved] , Target , Features ) , 
{ frame (L, action, Target, [S] ) }. 



% apoptosis causing cleavage of Psl by Zvad. 
% need to invert the order of nounactpatt and actionlmod 
actionlmod(L, ving) --> processobj ect (A) , % process or nounacpatt, 

action (Sem, [ving] , Target , Features) , 
{ frame (L, action, Target, A) }. 



actionlmod ([] ,_) --> [] . 



actionrmod(R, ved) --> action(Sem, [ved] , Target , Features) , 

byagent (A) , % may have to add ving to actionrmod 
{ frame (R, action, Sem, A) }. 
actionrmod ([] ,_) --> [] . 



% 

% actpatt parses a simple action between substances expressed by an active verb 
% 

% actpatt is saved in a symbol table (st) ; check for success/failure % % 1st 

% Case where actpatt is in st and has been successful 

actpatt(F) --> checkst (actpatt ,_, s, F) . 

% Case where actpatt is in st as a failure. 

actpatt (_) --> checkst (actpatt, _, f,_) , {!, fail}. 

% actpatt 1 : substance acts on substance 
% PDKl phosphorylates p70s6k at Thr229 
actpatt (F) --> 

snoop (SO, SO) , % SO is the input string 
{ \+ checkst (actpatt , 1 ,_/_/30,_)}, 



substances (Al) , 

sem_whichrel , % opt 'that' 

action (Semclass, [vp,ved] , Target , Features) , 

prepopt, % added prepopt to allow action 'to' and 'with' substance 
substances (A2) , 
siteinf o (Site) , 
snoop (S , S) , 
{ (member (def , Features) , 
modlist ( [Al,A2,Site] , Mods) ; 
member (rev, Features) , 
modlist ( [A2,Al,Site] , Mods) ) , 
frame (F, action, Target, Mods) , 
addst (actpatt , 1 , s, F, SO, S) 

}• 

% acpatt 2 : 

% Substance was bound by Substance 

% Substance was associated to substance. 

% F can give either first or second place to the second argument; 

a by agent gets first position; prepagent gets second. 
% Phosphorylated Fyn was associated with Cbl . 

actpatt (F) - - > 

snoop (SO, SO) , % SO is the input string 
{ \+ checkst (actpatt , 2 SO ,_)} , 
substances (Al) , 
sem_beterm (_) , 

action (Semclass, [ven] , Target , Features) , 
optbyorprepagent (Position, A2) , 
snoop (S,S) , 
{ (member (def , Features), 

(Position=second, modlist ( [Al,A2,Site] ,Mods) ; 
Posit ion= first, modlist ( [A2, Al, Site] ,Mods) ) ; 
member ( rev , Features ) , 

(Position=second, modlist ( [A2 , Al, Site] , Mods) ; 
Position= first, modlist ( [Al , A2 , Site] , Mods) )) , 
frame (F, act ion, Target, Mods) , 
addst (actpatt, 2 , s, F, SO, S) 

}• 

% no more actpatt - save failure 

actpatt (_) --> addst (actpatt, 0, f,_) , {!, fail}. 

% 

% nounactpatt parses a simple action between substances expressed by a nominal 

% verb 

% 

% nounactpatt is saved in a symbol table (st) ; check for success/failure 1st 
% Case where nounactpatt is in st and have been successful 
nounactpatt (Fmt) --> checkst (nounactpatt ,_, s, Fmt) . 
% Case where nounactpatt is in st as a failure, 
nounactpatt (_) --> checkst (nounactpatt ,_, f,_) , {!, fail}. 

% nounactpatt 1: 

% Jnk phosphorylation of Bad 

nounactpatt (F) --> 

snoop (SO, SO) , % SO is the input string 
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{ \+ checkst (nounactpatt , 1 ,_, _, SO, _) }, 
substances (Al) , 
{aminoacidtest (Al) } , 
optdash, 

action (Semclass, [n] , Target , Features) , 
of object <A2) , 
% siteinfo (Site) , 
snoop (S, S) , 
{ (member (def, Features), 

modlist ( [Al, A2, Site] , Mods) ; 

member (rev, Features) , 

modlist ( [A2,Al,Site] ,Mods) ) , 

frame (F, action, Target , Mods) , 

addst (nounactpatt, 1, s, F, SO, S) 

}• 

% nounactpatt 2 : the binding of substance and substance 
% association of Fyn and Cbl. 

% the reason for having this as a separate pattern is to 

% prevent ' Fyn and Cbl ' from .being parsed together as substances 

nounactpatt (F) --> 

snoop (SO, SO) , % SO is the input string 
{ ■= V+ checkst (nounactpatt , 2 , _, _, SO , _) } , 
action (attach, [ving,n] , Target , Features) , 
ofobjectl (Al) , 
andobject (A2) , 
% siteinfo (Site) , 

snoop ( S , S ) , 
{ modlist ( [A1,A2, Site] , Mods) , 
frame ( F , action , Target , Mods ) , 
addst (nounactpatt ,2,s,F,S0,S) 

}• 

% nounactpatt 3 : 

% The cleavage of protein by substance. 

% Association of phosphorylated Fyn with Cbl 

% Tyrosine phosphorylation of Cbl by kinase 

% optbyorprepagent determines the order of arguments; byagent is placed first 
% prepagent is placed second 

nounactpatt (F) --> 

snoop (SO , SO) , % SO is the input string 
{ \+ checkst (nounactpatt , 3 /_/_/S0,_)}, 
actionof (F) , 
snoop (S, S) , 
{ addst (nounactpatt , 3 , s,F,S0,S) }. 

actionof (F) 

siteinfo (Site) , 

action (Semclass, [ving,n] , Target , Features) , 
optof object (Al) , 
optbyorprepagent (Position, A2) , 
snoop (S, S) , 
{ (member(def, Features), 

(Position=second, modlist ( [Al,A2,Site] ,Mods) ; 

Position^ first, modlist ( [A2 , Al , Site] , Mods) ) ; 

member (rev, Features) , 



(Position=second / modlist ( [A2 / Al / Site] ,Mods) ; 
Position= first, modlist ( [Al, A2 , Site] , Mods) )) , 
frame (F, action, Target, Mods) 

}• 

% nounactpatt 4 : 

% Fyn association with Cbl . 

nounactpatt (F) --> 

snoop (SO, SO) , % SO is the input string 
{ \+ checkst (nounactpatt , 4 SO , _) }, 

substances (Al) , 

action (Semclass, [ving,n] , Target , Features) , 
withobject (A2) , 
% siteinfo (Site) , 
snoop ( S , S ) , 
{ modlist ( [Al,A2,Site] ,Mods) , 
frame (Faction, Target, Mods) , 
addst (nounactpatt, 4 , s, F, SO, S) 

}• 

aminoacidtest (X) :- X \= [aminoacid|_] . 

% nounactpatt 5 : " ' 

% IL-2 gene transcription 

% Cbl phosphorylation [by substance or action] 
nounactpatt (F) --> 

snoop (SO, SO) , % SO is the input string 
{ \+ checkst (nounactpatt , 5 /_/_,S0,_) }, 

substances (A2) , 

optdash, 

action (Semclass, [n] , Target , Features) , 

optbyagent (Al) , 
% siteinfo (Site) , 

snoop ( S , S ) , 
{ (member (def, Features), 

modlist ( [A1,A2, Site] ,Mods) ; 

member (rev, Features) , 

modlist ( [A2,Al,Site] ,Mods) ) , 

frame ( F , action , Target , Mods ) , 

addst (nounactpatt , 5 ,s,F,S0,S) 

}• 

% nounactpatt 6 : 

% fyn-cbl association. 

nounactpatt (F) --> 

snoop (SO, SO) , % SO is the input string 
{ \+ checkst (nounactpatt , 6 ,_,_,S0,_) }, 

substances (Al) , 

optdash, 

substances (A2) , 

action (Semclass, [n,ving] , Target , Features) , 
% siteinfo(Site) , 
snoop (S, S) , 
{ modlist ( [A1,A2, Site] , Mods) , 
frame (F, action, Target, Mods) , 
addst (nounactpatt, 6 , s , F, SO , S) 

}. 
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% nounactpatt 7 : 

% Cbl phosphorylated by fyn. 

nounactpatt (F) --> 

snoop (SO, SO) , % SO is the input string 
{ \+ checkst (nounactpatt , 7 ,_,_/S0,_)}, 
substances (Al) , 

action (Semclass, [ven] , Target , Features) , 
[by] , 

substances (A2) , 
% siteinf o (Site) , 

snoop (S, S) , 
% { (member (def, Features), 

{ modlist ( [A2,A1, Site] , Mods) , 
% member (rev, Features) , 

% modlist ( [Al,A2,Site] ,Mods) ) , 

f rame (F, action, Target , Mods) , 
addst (nounactpatt, 7, s, F, SO, S) 

}• 

% no more nounactpatt - save failure 

nounactpatt (_) --> addst (nounactpatt, 0, f,_) , {!, fail}. 



connectact (Sem, Syn, Target , Features) --> 
action (Sem, Syn, Target , Features) , 

{member (Sem, [cause , causel , activate , inactivate , signal , substitute , promote] ) } . 

connectacts (Sem, Syn, Target, Features) --> 

connectact (Sem, Syn, Target , Features) . 

% aminoacid like tyrosine : ex.: tyrosine Cbl phosphorylation 
% at position 201 Thr 
siteinfo(S) --> aminoacid (A) , 

{frame (S, site, [A] , [] ) } . 

siteinfo(S) --> 

sitepreps, % 'in', 'at 1 
position (S) . 
siteinfo( [] ) --> [] . 
sitepreps --> prepterm (in, _) . 
sitepreps --> prepterm (at ,_) . 
position(S) --> [position] , 

sem_integerterm (I) , 
{ frame (S, site, I, [] ) } . 



% The definitions of actions refer to the lexicons lexsynact.pl and lexsemact.pl 
% Sem is the semantic class; Syn is the syntactic class 
% F is the target 

% oneaction was added for use with moreaction to allow parsing of conjoined 
% actions 

oneaction (activate, Syn, F, Features) --> activateterm (Syn, F, Features) , { !} . 
oneaction (attach, Syn, F, Features) --> attachterm (Syn, F, Features) , { ! } . 

oneaction (breakbond, Syn, F, Features) --> breakbondterm (Syn, F, Features) , {!} . 



II 



oneaction (createbond, Syn, F, Features) 
oneact ion (inactivate, Syn, F, Features) 
oneaction (react , Syn, F, Features) 
oneaction (release, Syn, F, Features) 
oneaction (signal, Syn, F, Features) 
oneaction (substitute, Syn, F, Features) 
oneaction (transcribe, Syn, F, Features) 
oneaction (promote, Syn, F, Features) 
oneaction (generate, Syn, F, Features) 
oneaction (cause, Syn, F, Features) - -> 



-> createbond term (Syn, F, Features) , { ! } 
-> inactivateterm (Syn, F, Features) , { ! } 
-> reactterm(Syn, F, Features) ,{!} . 
--> releaseterm(Syn, F, Features) , { ! } . 
-> signal term (Syn, F, Features) , { ! } . 
-> substituteterm (Syn, F, Features) , { ! } 
-> transcribeterm (Syn, F, Features) , { ! } 
-> promote term (Syn, F, Features) , { ! } . 
-> generateterm (Syn, F, Features) , { ! } . 
causeterm (Syn, F, Features) , { ! } . 



action (activate, Syn, F, Features) --> activateterm (Syn, Al, Features) , 

moreaction(Conj , Args) , 
{Conj = [] ,F =A1; 

Conj\= [] , mergemods ( [ [action,Al] ] , Args, Actions) , 
frame (Fl, relation, Conj , Actions) , F= [Fl] } . 
action (attach, Syn, F, Features) --> attachterm (Syn, Al ,Features), 

moreact ion (Conj , Args) , 
{Conj = [] ,F -Al/ 

Con_j \ = [ ] f mergemods ( [ [act ion , Al ] ] , Args , Actions ) , 
frame (Fl, relation, Conj , Actions) , F = [Fl] } . 
action (breakbond, Syn, F, Features) -- > breakbondterm( Syn, F, Features) , _ 
--=-■= " more act: ion (Conj /Args) , 
{Conj = [] ,F =A1; 

Conj\= [] , mergemods ( [ [action, Al] ] , Args , Actions) , 
frame (Fl, relation, Conj , Actions) , F = [Fl] } . 
action (createbond, Syn, F, Features) --> createbondterm (Syn, F, Features) , 

moreact ion (Conj ,Args) , 
{Conj = [] ,F =A1; 

Conj\= [] , mergemods ( [ [action, Al] ] , Args , Actions) , 
frame (Fl, relation, Conj , Actions) , F = [Fl] } . 
action (inactivate, Syn, F, Features) --> inactivateterm (Syn, F, Features) , 

moreact ion (Conj , Args) , 
{Conj = [] ,F =A1; 

Conj\= [] , mergemods { [ [action, Al] ] , Args , Actions) , 
frame (Fl, relation, Conj , Actions) , F = [Fl] } . 
action (react, Syn, F, Features) --> reactterm (Syn, F, Features) , 

moreact ion (Conj ,Args) , 
{Conj = [] ,F =A1; 

Conj\=[] , mergemods ([ [action, Al] ] , Args , Actions) , 
frame (Fl, relation, Conj , Actions) , F = [Fl] } . • 
action (release, Syn, F, Features) --> releaseterm (Syn, F, Features) , 

moreact ion ( Conj , Args) , 
{Conj = [] ,F =A1; 

Conj\=[] , mergemods ([ [action, Al] ] , Args , Actions) , 
frame (Fl, relation, Conj , Actions) , F= [Fl] } . 
action (signal, Syn, F, Features) signalterm (Syn, F, Features) , 

moreaction (Conj , Args) , 
{Conj = [] ,F =A1; 

Conj\= [] , mergemods ( [ [action, Al] ] , Args , Actions) , 
frame (Fl, relation, Conj , Actions) , F= [Fl] } . 
action (substitute, Syn, F, Features) --> substituteterm (Syn, F, Features) , 

moreaction (Conj ,Args) , 
{Conj - [] ,F =A1; 

Conj\=[] , mergemods ( [ [action, Al] ] , Args , Actions) , 
frame (Fl, relation, Conj , Actions) , F= [Fl] } . 
action (transcribe, Syn, F, Features) --> transcribeterm (Syn, F, Features) , 
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moreaction (Conj , Args) , 
{Conj = [] ,F =A1; 

Conj\= [] , mergemods ( [ [actional] ] , Args , Actions) , 
frame (Fl, relation, Conj , Actions) , F= [Fl] } . 
action (promote, Syn, F, Features) --> promoteterm <Syn, F, Features) , 

moreaction (Conj , Args) , 
{Conj = [] ,F =A1; 

Conj\=[] , mergemods ( [ [action, Al] ] , Args, Actions) , 
frame (Fl, relation, Conj , Actions) , F= [Fl] } . 
action (generate, Syn, F, Features) --> generateterm (Syn, F, Features) , 

moreaction (Conj , Args) , 
{Conj = [] ,F =A1; 

Conj\= [] , mergemods ( [ [action, Al] ] , Args, Actions) , 
frame (Fl, relation, Conj , Actions) , F= [Fl] } . 
action (cause, Syn, F, Features) --> cause term (Syn, F, Features) , 

moreaction (Conj , Args) , 
{Conj = [] ,F =A1; 

Conj\= [] , mergemods ( [ [action, Al] ] , Args, Actions) , 
frame (Fl, relation, Conj , Actions) , F= [Fl] } . 

% binds, phosphorylates and activates 
moreaction (Conj , Args) --> sem_conj rest (Conj 1) , 

- - — oneaction (Sem, Syn, A, Features) , 
moreaction (Conj 2 ,Alist) , 

{Conj2 = [] , Alist=[] ,Conj=Conjl, Args = [[action, A]] 
Conj 2 \= [] , Conj = Conj 2, 
addmod ( [action, A] , Alist , Args) } . 

moreaction ( [] , [] ,S,S) . 



passiveconnect (Sem, [ven] , Target , Features) --> 
sem_beterm (_) , 

connec tact (Sem, [ven] , Target , Features) . 



processpatt (A) --> disease (A) . 
processpatt (A) --> process (A). 



optbyorprepagent (f irst, A) --> byagent (A) . 
optbyorprepagent (second , A) - - > prepagent (A) 
optbyorprepagent (first , A) --> [] , {A = x} . 

byorprepagent (f irst , A) --> byagent (A) . 
byorprepagent (second, A) --> prepagent (A) . 

optbyagent (A) --> byagent (A) . 
optbyagent (A) --> [] , {A = [x] } . 

byagent (A) - - > [by] , 

substances (A) . 
byagent (A) --> [by], 

nounactionpatt (A) . 
prepagent (A) --> withobject (A) . 
prepagent (A) --> toobject(A). 
% prepagent (A) --> andobject (A) . 
prepagent (A) --> of object (A). 
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% optprepagent (A) - - > byagent (A) . 
optprepagent (A) --> of object (A), 
optprepagent (A) --> withobject (A) . 
optprepagent (A) --> toobject(A). 
optprepagent (A) --> andobject (A) . 
optprepagent (A) --> [] , {A= [x] } . 

ofobject(A) --> [of], 

nounactionpatt (A) . 
ofobject(A) --> [of], 

substances (A) . 
ofobject(A) --> [of], 

actionof (A) . 
of obj ectl (A) - - > [of] , substance (A) . 
optof object (A) --> ofobject(A). 
optof object ( [x] ) --> [] . 



% to parse Binding of Fyn and Bad 



processobject (A) --> process (A) . % can be expanded to nounactpatt, etc 



% opt withobject (A) --> withobject (A) . 
% optwithobject (A) --> [] , {A = [x] } . 
withobj ect (A) - — > [with] , substances (A) . 
toobject(A) --> [to], substances (A) . 
andobject (A) --> [and], substances (A) . 
prepobject (A) --> [to] , substances (A) . 
prepobject (A) --> [with], substances (A) . 



optbyarg(A) --> [by], 

actionarg (A) . 
optbyarg(A) --> substances (A) . 

optbyarg(A) --> [] , {A = ['substance unknown']}. 



prepopt --> [to] . 

prepopt --> [with] . 

prepopt --> [by] . 

prepopt --> [of] . 

prepopt --> [] . 



% toopt 

toopt --> [to] . 
toopt --> [] . 
% withopt 

withopt - -> [with] 
withopt --> [] . 



optdash --> ['-']. 

optdash --> [ ] . 

optof --> [of] . 

optof --> [ ] . 

/* optactionarg (A) --> actionarg (A) 

optactionarg ( [] ) --> [] . */ 



optactionarg (A) --> 
actionarg (A) . 



7? 



% there is no further argument 
optactionarg (A) --> 
[] , 

{A = [] }. 

% substances (F) --> substance (F) . 

% substances (F) --> substance (PI) , 

% moresubstances (Conj , Plist) , 

% { Conj = [] , Plist = [] , F = PI 

% Conj \= [] , 

% mergemods (PI , Plist , Args) , 

% f rame (F, relation, Conj , Args) 

% }• 

% substances (F) --> substanceswithmods (F) . 

% substances (A) --> 

% proteins (A) . 

% subswithmods . txt 



% substances is saved in a symbol table (st) ; 
% check for success/failure 1st 

% Case where substances is in st and has been successful 
substances (Fmt) --> checkst (substances, s, Fmt) . 
% Case where substance is in st as a failure", 
substances (_) --> checkst (substances , f,_) , {!, fail}. 

substances (F) - - > 

snoop (SO, SO) , 
{ \+ checkst (substances, 1, s,_, SO, _)} , 
lmods (Lmods) , % left modifiers 

(severalsubstances ( [relation, Conj , First | Rest] ) , % conjoined substances 

rmods (Rmods) , % right modifiers 

% create list of lists containing distributed mods, of substances 

{ distributesubs (Dist, [First | Rest] , Lmods , Rmods) , 
% check Lmods - "no" Fl or F2 should be changed to no Fl and no F2 

f ixconj (Lmods , [rel , Conj ] , [rel , C2] ) , 
%splice ( [Conj , Dist] , F) 

frame (F, relation, C2 , Dist) } ; 
% substances and modifiers without conjunction 

substance (Dl) , 

rmods (Rmods) , 

{Dl = [Typel, Substancel |ModsDl] , 
delete (ModsDl, [] , ModsD2) , 
append ( [Lmods, Rmods] , ModsD2 , Al lmods 1) , 
delete (Allmodsl, [] , Allmods2) , 
frame (F, Typel, Substancel, Allmods2) }) , 
snoop (S, S) , 
{ adds t (substances, 1, s, F, SO, S) } . 

/* substances (F) --> snoop (SO , SO) , 

{\+ checkst (substances, 3 /S,_,S0,_)}, 

complex (F) , 
{addst (substances, 3, s,F, SO, S) } . 

*/ 

% no more substances- save failure 

substances ( ) --> addst (substances, 0, f,_) , {!, fail}. 
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severalsubstances (F) --> 



substance (PI) , 
moresubstances (Conj , Plist) , 
Conj = [] , Plist = [] , F = 
Conj \= [] , 

addmod (Pi, Plist, Args) , 
frame (F, relation, Conj , Args) 



PI 



% ' X, Y, and Z' 
moresubstances (Conj , 



Args) --> sem_conj rest (Conj 1) , 
substance (PI) , 

moresubstances (Conj 2 , Plist) , 
{ Conj2 = [] , Plist = [] , Conj = 
Conj 2 \= [] , Conj2\= /, Conj 
addmod (PI, Plist , Args) 

}• 



Conj 1 , Args 
= Conj 2, 



[PI] 



% to allow for substances with modifiers 
moresubstances (Conj 1, Args) --> sem_conj rest (Conj 1) , 

substances (Args) , { ! } . 



moresubstances ([],[] ) --> []. % no conjunction 



% distributesubs 

% distributes left mods and right mods over list of findings creating 
% list of lists of findings with mods 
distributesubs ([],[] ,_,_) :- !. 
distributesubs (Dist, [Dl|Tail] , Lmods , Rmods ) :- 

distributesubs (Dist2, Tail, Lmods, Rmods) , %distributed for remainder 

Dl = [Typel, Substancel |ModsDl] , 

append ( [Lmods, Rmods] , ModsDl ,Al lmods 1) , 

delete (Allmodsl, [] ,Allmods2) , 

frame (D, Typel, Substancel, Allmods2) , 

append ( [D] ,Dist2, Dist) . % Combine findings to get list of findings 

lmods(A) --> stateterm(F) , 

{frame (A, state, F, [] ) } . 
lmods ( [] ) - - > sem_measure (_) . 
lmods ([]) --> [] . 
rmods ( [] ) --> [] . 

stateterm(F) --> acclex (state , F) . 

% for past participle of createbond and breakbond actions, the target 
% is the word, ex . : . phosphorylated, dephosphorylated, methylated 
stateterm(F) 

snoop (SO, SO) , % get the initial string 
createbondterm( [ven] , _,_) , 

{SO = [F|_]}. %get the first word of the string 
stateterm(F) --> 

snoop(S0,S0) , % get the initial string 
breakbondterm( [ven] , _,_) , 

{SO = [F|_]}. %get the first word of the string 
% may have to add attachterm for 'bound' 



% Taken from MedLEE grammar to handle '3 cm' 
sem_measure (M) --> 

sem_j?remeasure , 
sem_quantityterm(N) , 
optdash, 

sem_measureterm(Unit) , 
{ f rame (M, measure, [N, Unit] ,[] ) }. 
% complex predicates added November 8, 1999 
% CrkL-C3G complex 
% ras: raf-1 association 
% ras: raf-1 complexes 
% shc-grb2-sos 
% TCR/CD3 complex 

% p/CAF-p/CIP-CBP/p300-SRC-l complex 
% Ras: Raf-1 complexes 
complex(C) --> proteins(P), 

{P = [A,B|_] ,A \= [] , B \= [] }, 
optcomplexword , 
{ frame (C, complex, [P] , [] ) } . 

% a complex of NFAT4 with calcineurin 
complex ( C ) --> complexword, . 

complexarg (A) , 

{frame (C, complex, [A] , [] ) } . 

complexarg (A) --> [of], proteins (A) . 

complexarg (A) --> [between], proteins (A) . 

% a complex between MyD88, IRAK-2, and the IL-IRs 

complexarg (A) --> action (contain) , proteins (A) . 

% Complexes containing BOB.l/OBF.l and Oct proteins 

proteins(P) --> protein (A) , 

moreproteins (PI) , 

{(A\=[] ; append ( [A] ,P1,P) ) } . 

moreproteins (A) --> proteinconnector, 

proteins (A) . 



moreproteins ( [] ) -- 
proteinconnector 
proteinconnector 
proteinconnector 
% connector --> 
% connector --> 
proteinconnector (C) 
optconnector - - > 
optconnector --> 



> [] . 

-> ['-']. 

['/']• 
-> [':■]. 

[',']. taken out not to conflict with relation in 
[and] . moresubstances 
--> [with] . 
proteinconnector . 
[] . 



complexword 
complexword 
complexword 



[complex] . 
[complexes] . 
['signaling complexes'] 



optcomplexword 
optcomplexword 



-> complexword. 
■> [] - 



substance (A) 



- -> protein (A) . 



substance (A) 
substance (A) 
substance (A) 
substance (A) 
substance (A) 
substance (A) 
substance (A) 
substance (A) 
substance (A) 
substance (A) 
substance (A) 
substance (A) 



■> cell (A) . 
•> species (A) . 
■> structure (A) . 
• > domain (A) . 

■ > gene (A) . 

-> geneorprotein (A) 
-> aminoacid (A) . 
■> small molecule (A) 
•> matter (A) . 

> proteinsite (A) . 

■ > disease (A) . 

> complex (A) . 



% this will be modified later 



protein (A) --> 

proteinterm (P) , 

{frame (A, protein, P, [] ) } . 

complex (A) --> 

complexterm (P) , 

{frame (A, complex, P, {] ) } . 

cell (A) --> 

cellterm(P) , 

{frame (A, cell, P, [] ) } . 

species (A) --> 

speciesterm (P) , 

{frame (A, species, P, [] ) } . 

structure (A) --> 

structureterm(P) , 

{frame (A, structure, P, [] ) } . 

domain (A) --> 

domainterm (P) , 

{frame (A, domain, P, [] ) } . 

gene (A) --> 

geneterm(P) , 

{frame (A, gene, P, [] ) } . 



geneorprotein (A) - - > 
gpterm(P) , 
[X] , 

{ (X = gene, frame(A, gene, P, [] ) ; 

X = protein, frame (A, protein, P, [] ) ; 

X\= gene, X \= protein, frame (A, geneorprotein, P, []))}. 



aminoacid (A) --> 

aminoacidterm(P) , 

{frame (A, aminoacid, P, [] ) } . 



smallmolecule (A) --> 

smallmoleculeterm (P) , 

{frame (A, ' small molecule ' , P, [] ) } . 



matter (A) --> 



/6 



matterterm (P) , 

{frame (A, substance, P, [] ) } . 

proteinsite (A) - - > 

proteinsiteterm(P) , 

{frame (A, 'protein site ' , P, [] ) } . 

disease (A) --> 

diseaseterm(P) , 
{frame (A, disease, P, [] ) } . 
process (A) --> 

processterm (Syn, F, Features) , 
{frame (A, process, F, []),!} . 
process (A) --> 

processterm (P) , 

{frame (A, process, P, [] ) , ! } . 



% terminals 

prot e in t ern i ( F ) - - > a cc lex 

complexterm(F) --> acclex 
cellterm(F) = _ _ --> acciex 

speciesterm (F) --> acclex 

structureterm (F) --> acclex 

domainterm(F) --> acclex 

geneterm(F) --> acclex 

gpterm(F) --> acclex 

aminoacidterm (F) --> acclex 
smallmoleculeterm(F) --> acclex 

matterterm (F) --> acclex 

proteinsiteterm (F) --> acclex 

diseaseterm (F) --> acclex 

processterm (F) --> acclex 



vprotem/rj . 
(complex, F) . 
(cell,F) . 
(species, F) . 
(structure, F) . 
(domain, F) . 
(gene, F) . 
(gp,F) . 

(aminoacid, F) . 
(smallmolecule, F) 
(substance , F) . 
(proteinsite , F) . 
(disease, F) . 
(process, F) . 



% action (activate, Syn, F, Features) 



activateterm(Syn, F, Features) 
attachterm(Syn, F, Features) 
breakbondt erm ( Syn , F , Features ) 
createbondterm (Syn, F, Features) 
inactivateterm(Syn, F, Features) 
reactterm (Syn, F, Features) 
releaseterm (Syn, F, Features) 
signalterm(Syn, F, Features) 
substituteterm(Syn, F, Features) 
transcribeterm (Syn, F, Features) 
promo teterm ( Syn , F , Features ) 
processterm (Syn, F, Features) 
generateterm (Syn, F, Features) 
cause term (Syn, F, Features) 



- > 

- > 

- > 

- > 

- > 

- > 

- > 

- > 

- > 

- > 

- > 

- > 

- > 

- > 



--> activateterm (Syn, F, Features) . 

acclexss (activate, Syn, F, Features) . 
acclexss (attach, Syn, F, Features) . 
acclexss (breakbond, Syn, F, Features) . 
acclexss (createbond, Syn, F, Features) 
acclexss ( inactivate , Syn , F , Features ) 
acclexss (react, Syn, F, Features) . 
acclexss (release, Syn, F, Features) . 
acclexss (signal, Syn, F, Features) . 
acclexss ( substitute , Syn , F , Features ) 
acclexss (transcribe, Syn, F, Features) 

acclexss (promote, Syn, Features) . 
acclexss (process, Syn, F, Features), 
acclexss (generate, Syn, F, Features) . 
acclexss (cause, Syn, F, Features) . 



% Semlist contains a phrase which is an action 
actionchk (Semlist ) :- 

intersect (Semlist, [attach, cause, createbond, breakbond, activate, 

inactivate , substitute , transcribe , express , promote , s ignal] 



% Semlist contains a phrase which is a connector action 



connectchk (Semlist ) :- 

intersect ( Semlist , [cause , activate , inactivate , substitute , 

promote, signal] ) . 



%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%^^%%% %%%% 
% Genome sectionc: ends here 

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%^%^%%^^^ %%%%%%% 
% relations are connected by conjunctions, or 
% certain "conn* prepositions. 

% Taken from MedLEE grammar to handle connectives that are conjunctions 
% Ex: "severe markings, possibly from tuberculosis" 

sem_relation(F, [] ) % relation and modifiers 

sem_commapunc , 

sem_certainty ( [] , C,rel) , 

prepterm(P, conn) , 

{frame (F, rel , P, C) } . 

%plice( [[rel,P] , C] ,R) . 

% Ex: "markings, swelling", "markings and swelling" 

sem_relation(R, □ ) - -_>_ sem_conjjrel (R^, 

sem_commapunc . 
% "density may represent known tumor" 

% "markings, and swelling" 
sem_conjrel (F) --> 

sem__commapunc , 

sem_conj term (Con j ) , 

{frame (F, rel, Conj ,[])}. 

sem_conjrest (Conj ) --> % restricted conj, has not sem_relation_showopt 

sem_commapunc , 
sem_conj term (Conj ) . 
% "markings , swelling" 
sem_conjrest ( ' , 1 ) --> 
snoop (SO , SO) , 

sem_commapunc , 
snoop ( S , S ) , 
{SO \= S}. 

% Treatment of Verbs from MedLEE 's Grammar 

% form of "be" 

sem_auxverb (B) --> sem_beterm (B) . 

% form of "do" 

sem_auxverb (B) --> sem_doterm (B) . 

% form of "have" 

sem_auxverb (B) --> sem_haveterm (B) . 

sem_recrel --> prepterm(in,_) . 
sem_recrel --> prepterm(to,_) . 
% "is not" 

sem_auxrel (V) sem_auxverb (_) , 

sem_negterm(V) . 
sem_auxrel (V) --> sem_auxverb (V) . 

% left modifiers of findings include negation, quantity, certainty, degree, s 
% change type modifiers 
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sem__integer (W) - - > [W] , { integer (W) } . 
sem_integer (W) --> integerterm (W) . 
sem_timeunit (T) --> sem_timeunitterm(T) . 

% From MedLEE grammar - "lasting 2 days", "for 2 day 
sem_duration (F) --> 

sem_durpreps , 

sem_premeasure, %about 

sem_timemeasure (T) , 

sem_durationmod, % opt. - "in duration" 
{frame (F, duration, [T] , [] ) } . 
sem_duration ( [] , S, S) . 

sem_durpreps --> [times] . 
sem_durpreps - - > 

prepterm(for,_) . 
sem_durpreps --> [lasting, for] . 
sem_durpreps --> [lasting] . 
s em durp r ep s — > [ las t e d , f o r ] . 
sem_durpreps --> [lasted]. 
sem_durationmod --> = 

sem_aposts, %opt . - n, s" 
[duration] . 
sem_durationmod --> [in] , [duration] . 
sem_durationmod --> [] . 
sem_aposts --> [ ,,,, ] / [s] . 
sem_apost --> [] . 

% sem_f requency taken From MedLEE ' s grammar 

% "two times", "times two", "two times a/per week", 

sem_f requency (F) - - > 

sem_f reqterm(Fl) , % "once" 

sem_f reqterm(F2) , % "a day" 

{frame (M, unitval , [Fl, F2] , [] ) , 
f rame (F, frequency, [M] , [] ) } . 

sem_f requency (F) --> 

sem_f reqterm (M) , % "qid", "daily" 
{frame (F, f requency, M, [] ) } . 

% "2 times", 

sem_f requency (F) --> 

sem_j?remeasure , 

sem_quantityterm (M) , 

sern_ times, 
{frame (F, frequency, [M] , [] ) } . 

% "times 2" 
sem_f requency (Q) --> 
sem_ times, 

sem_quantityterm (Ql) , 
{frame (Q, frequency, Ql , [] ) } . 
sem_f requency (F) --> 

[q] , sem_quantityterm(Q) , 

sem_timeunit (T) , 
{frame (F, frequency, [unitval, [Q, T] ],[])} . 
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sem_f requency (F) --> sem_eachevery , 

sem_quantityterm(Q) , 
sem_timeunit (T) , 
{frame (F, frequency, [unitval, [Q, T, every] ] , [] ) } . 
sem_f requency (Q) --> % "second" 
sem_ordinal (0) , 
sem_timeopt , 

{ frame (Q, frequency, O, [] ) } . 
sem_f requency ( [] ,S,S) . 
sem_timeopt --> [time] . 
sem_timeopt --> [] . 
sem_eachevery --> [each] . 
sem_eachevery --> [every] . 
sem_times- -> [times] . 
sem times- -> [x] . 



% Taken from MedLrEE : s grammar 

negation modifier - "no" as in "no cardiomegaly" 
sem_negation (F) _--> _ _.. . 

sem__negterm (N) , 
{frame (F,neg,N, [] ) } . 
% negation not present 
sem_negation ( [] ,S0,S0) . 

% Taken from MedLEE * s grammar 

% quantity modifier - "two" as in "two masses" 
sem_quantity (F) --> 
snoop (SO, SO) , 

{ \+ checkst (sem_dates,l,s,_,SO,_) }, % not a legitimate date 
sem_quantityterm (Q) , 

sem_quantityrmod(_) , % "2 or 3", "2 to 3" 

{\+ next_wordunit (SO) , % rule out '2 mm' 
f rame (F, quantity , Q, [] ) 

}- 

sem_quantity ( [] ,S0,S0) . 



sem_commapunc ( [ ■ , ' | S] , S) . 
sem__commapunc (S , S) . 

sem_conj term (C) --> acclex (conj , C) . 

sem_doterm (D) --> acclex (vdo, D) . 

sem_endmark ( [ . | S] , S) . 
sem_endmark ( [ ; j S] , S) . 

sem_f reqterm (F) --> acclex (freq, F) . 

sem_haveterm (H) --> acclex (vhave, H) . 

integerterm(I) --> acclex (integer , I) . 

sem_measureterm (M) --> acclex (unit, M) . 
sem_medterm (M) --> acclex (med, M) . 

sem_negterm(N) --> acclex (neg, N) . 

prepterm(P,C) --> acclex (p, [P, C] ) . 

sem timeunitterm(T) --> acclex (timeunit,T) 



% lexog - adapted from MedLEE lexicon 

%%%%%%%%%%%%%%%%%%% CLOSED WORD CATEGORY LEXICON %%%%%%%%%%%%%%%%%%%%%%%% 
%%%%%%%%%%%%%%%%%%%%% NEGATIONS %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% 

: -unknown (_, fail) . 

: -multifile (wdef/3) . 
wdef (cannot, neg, no) . 
wdef (neither, neg, no) . 
wdef (never, neg, no) . 
wdef (no, neg, no) . 
wdef (non, neg, no) . 
wdef (none, neg, no) . 
wdef (not , neg, no) . 
wdef (nothing, neg, no) . 

%%%%%%%%%%%%%%%%%%%%% CONJUNCTIONS %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% 

wdef ( ' & ' , conj , and) . 
wdef ( 1 / ' , conj , or) . 
wdef ( 1 - ' , grammar, ' - ' ) . 
wdef ( 1 + ' , conj , and) . 
wdef (although, conj , and) . 
wdef ~(and , conj , and) . 
wdef (as, conj , and) . 

wdef (because, conj , and) . _ _ = 

wdef (but, conj , and) . 

wdef ( ' , * , conj , * , 1 ) . 

wdef (except, conj , no) . 

%wdef (if , grammar, if ) . 

wdef (minus , conj , no) . 

wdef (nor, conj ,no) . 

wdef (or, conj , or) . 

wdef (that , grammar , that) . 

wdef (though, conj , and) . 

wdef (thru, conj , and) . 

wdef (verses , conj , or ) . 

wdef (versus, conj , or) . 

wdef (vs , conj , or) . 

wdef (when, grammar, when) . 

wdef (where, grammar , where) . 

wdef (whereas , conj , and) . 

wdef (which, grammar , which) . 

wdef (while , conj , and) . 

wdef (who , grammar , who) . 

wdef (yet , conj , and) . 

%%%%%%%%%%%%%%%%%%%%% PREPOSITIONS %%%%%%%%%%%%%%%%%%%%%%%%%%%%% 

wdef (above, ploc, above) . 

wdef (about, p, [approximately, nconn] ) . 

wdef (about , ploc, about) . 

wdef (across , ploc, across) . 

wdef (abutting, ploc, near) . 

wdef (accompanies, p, [with, conn] ) . 

wdef (accompanying, p, [with, conn] ) . 

wdef (adjacent, ploc, adjacent) . 

wdef (adjacent , region, adjacent) . 

wdef (after, p, [after, conn] ) . 

wdef (after, tprep, after) . 

wdef (along, p, [on, nconn] ) . 

wdef (approximately, p, [approximately, nconn] ) . 
wdef (around, p, [approximately, nconn] ) . 
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wdef (at ,p, [at , nconn] ) . 

wdef (atop,p, [on, nconn]) . 

wdef (before, ploc, before) . 

wdef (before, tprep, before) . 

wdef (behind, ploc, behind) . 

wdef (below, ploc, below) . 

wdef (between, ploc, between) . 

wdef (beyond, ploc, beyond) . 

wdef (by, ploc, near) . 

wdef (despite, p, [with, conn] ) . 

wdef (during, p, [during, conn] ) . 

wdef (during, tprep, during) . 

wdef (encasing, ploc, encasing) . 

wdef (extending, p, [in, nconn] ) . 

wdef (following, p, [after, conn] ) . 

wdef (following, tprep, after) . 

wdef (for, p, [for, nconn] ) . 

wdef (from, p, [from, conn] ) . 

wdef (in, p, [in, nconn] ) . 

wdef (including, p, .[.with, conn] ) t 

wdef (into, p, [in, nconn] ) . 

wdef (involving, p, [of , nconn] ) . 
O -wdef "(next rtprep ;nextf ) r 
\1 wdef (occupying, p, [in, nconn] ) . 
{J! wdef (on, p, [on, nconn] ) . 
™ wdef (of , p, [of , nconn] ) . 
=1 wdef (over , ploc, over) . 

wdef (overlie, ploc, over) . 

wdef (overlied, ploc , over) . 
|^ wdef (overlies , ploc , over) . 
""4 wdef (overlying, ploc, over) . 
z wdef (prior , tprep, before) . 
r| wdef (near, ploc, near) . 
K :l wdef (radiating, ploc, radiating) . 
l = - b wdef (regarding, p, [about , nconn] ) . 

"=3 wdef (roughly, grammar, roughly) . % 'roughly 6 mm' 

fll wdef (since, p, [since, conn] ) . 

wdef (since, status, subsequent) . 
^ wdef (through, p, [in, nconn]) . 

wdef (throughout , p, [in, nconn] ) . 

wdef (to, p, [to, nconn] ) . 

wdef (toward, p, [to, nconn] ) . 

wdef (towards , p, [during, conn] ) . 

wdef (under , ploc, below) . 

wdef (underneath, ploc, below) . 

wdef (until, tprep, until) . 

wdef (up, grammar, up) . 

wdef (upon, p, [on, nconn] ) . 

wdef (via, p, [with, conn]) . 

wdef (with, p, [with, conn]) . 

wdef (within, p, [in, conn]). 

wdef (without ,p, [no, conn]) . 

%wdef (without , neg, no) . 



%%%%%%%%%%%%%%%%%%%%%%%%%% UNITS OF MEASURE %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% 
wdef ( ' % ' , unit , percent ) . 
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wdef (cc, unit , cc) .. 

wdef (centimeter , unit , cm) . 

wdef (centimeters , unit , cm) . 

wdef (cm, unit , cm) . 

wdef (degrees , unit , degree) . 

wdef (gm, unit, gram) . 

wdef (gms , unit , gram) . 

wdef (gram, unit, gram) . 

wdef (grams, unit, gram) . 

wdef (kg, unit kilogram) . 

wdef (kilo, unit , kilogram) . 

wdef (kilogram, unit, kilogram) . 

wdef (kilograms , unit , kilograms) . 

wdef (liter , unit , liter) . 

wdef (liters, unit, liter) . 

wdef (microgram, unit, microgram) . 

wdef (micrograms, unit, microgram) . 

wdef (milliliter, unit , ml) . 

wdef (milliliters, unit, ml) . 

wdef (milligram, unit, mg) . 

■wdef (mi 1 1 igrams , lirii t , mg ) . 

wdef (milliseconds, unit, millisecond) . 

wdef (mill i volt s , unit , millivolt ) - 

wdef (ml , unit , ml ) . 

wdef (millimeter , unit , mm) . 

wdef (millimeters , unit , mm) . 

wdef (mm, unit , mm) . 

wdef (ozs, unit, ounce) . 

wdef (percent , unit, percent) . 

%%%%%%%%%%%%%%%%%%%%%%%%% NUMBERS %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% 

wdef (half , integer, ' one half). 

wdef (semi, quantity, semi) . 

wdef (ii, integer , 2) . 

wdef (iii , integer , 3 ) . 

wdef ( vi , integer , 4 ) . 

wdef (v, integer , 5) . 

wdef (vi , integer , 6 ) . 

wdef (vii, integer, 7) . 

wdef (viii, integer, 8) . 

wdef (ix, integer, 9) . 

wdef (xii, integer , 12) . 

wdef (xiii, integer, 13) . 

wdef (one, integer, 1) . 

wdef (two, integer, 2) . 

wdef (double, quantity, double) . 

wdef (three, integer, 3) . 

wdef ( four , integer , 4 ) . 

wdef (quadruple, quantity, quadruple) . 

wdef (five, integer, 5) . 

wdef (six, integer, 6) . 

wdef (sixty, integer , 60) . 

wdef (seven, integer, 7) . 

wdef (eight , integer , 8) . 

wdef (nine, integer, 9) . 

wdef (ten, integer, 10) . 

wdef (eleven, integer, 11) . 

wdef (twelve, integer, 12) . 
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thirteen, integer, 13) . 
fourteen, integer, 14) . 
fifteen, integer , 15) . 
sixteen, integer , 16) . 
seventeen, integer, 17) . 
eighteen, integer , 18) . 
nineteen, integer, 19) . 
twenty, integer, 20) . 
thirty, integer , 30) . 
forty, integer , 40) . 
fifty, integer , 50) . 
sixty, integer , 60) . 
seventy, integer , 70) . 
eighty, integer, 80) . 
ninety, integer , 90) . 
hundred, integer , 100) . 
thousand, integer, 1000) . 
million, integer, 1000000) . 
billion, integer , billion) . 
zero, integer, 0) . 
f irst , ointeger , 1) . 
second, ©integer , 2) . 
third, ointeger, 3 ) . 
fourth, ointeger , 4) . 
fifth, ointeger , 5) . 
sixth, ointeger , 6) . 
seventh, ointeger , 7) . 
eighth, ointeger , 8) . 
ninth, ointeger , 9) . 
tenth, ointeger, 10) . 
eleventh, ointeger , 11) . 
twelvth, ointeger, 12) . 
thirteenth, ointeger, 13) . 
fourteenth, ointeger, 14) . 
fifteenth, ointeger, 15) . 
sixteenth, ointeger, 16) . 
seventeenth, ointeger , 17) . 
eighteenth, ointeger, 18) . 
ninteenth, ointeger , 19) . 
triple, quantity, triple) . 
twentieth, ointeger, 20) . 
thirtieth, ointeger, 30) . 
single, quantity, 1) . 
solitary, quantity, 1) . 

frequency, grammar , frequency) . */ 
, grammar ,'.'). 
, grammar, 1 ; ' ) . 
, grammar ,'/')• 
, grammar , ' : 1 ) . 

, certainty, "moderate certainty') 
, certainty, 'high certainty 1 ) . 
* , grammar, ' 1 ' * ) . 



%%%%%%%%%%%%%%%%%%%% FREQUENCIES 
once, f req, 1) . 
times , grammar ,x) . 



%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%*% 



wdef (-twice, f req, 2) 
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% lexicon with lexOg containing common English words adapted from lexO of 
MedLEE% 

% lexlg from lexl of MedLEE 
% August 23, 1999 

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%^ %%%%%%%%%%%%%%%% 
% CAROL FRIEDMAN % 

% QUEENS COLLEGE , COLUMBIA UNIVERSITY * 

% 

% Version 3.0 4-01-00 % 

% Version 2.0 1-31-96 % 

% Version 1.0 1-5-92 % 



% 
% 



% 



% 



% 
% 



% SEMANTIC LEXICON FOR CLINICAL TEXT % 



% 



% The lexicon consists of several files: * 

% lex0g.pl: single word closed classes % 

% lexlg.pl: single word - general modifier type words: % 

% 

% wdef (category, target) . ° 

% word - is the name of the word being categorized; % 

% category - is the semantic category for the word % 

% target - is the canonical /standard- form for the word % 

% " words which are synonyms should be assigned the same % 

% canonical form. % 

% multi-word phrases are categorized as follows: % 

% phrase (word, category , phrase , target) . * 

% % o 

% Semantic Categories: 



% 



% certainty "possible" % 

% canonical values limited to: moderate - for possible % 

% high - for high possible % 

% low - for low possible % 

% conj - relational operators "and", "or" , which connect one finding % 

% to another finding * 

% neg - negation "no", "not" 

% quant - for quantitative information "many" % 

: -unknown (_, fail) . 

: -ensure_loaded( [nsphrase, lexOg, lexlg, lexsemact, lexsyn, lexsub] ) . 
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% definitions kept from MedLEE lexicon - lexl.pl 

wdef (be, vbe, 'high certainty') . 

wdef (been, vbe, 'high certainty') . 

wdef (being, vbe, 'high certainty') . 

wdef (was, vbe, 'high certainty') . 

wdef (is, vbe, 'high certainty') . 

wdef (were, vbe, 'high certainty') . 

/* 

wdef (became, vcertainty, 'high certainty*) . 
wdef (become, vcertainty, 'high certainty') . 
wdef (becomes, vcertainty, 'high certainty') . 
wdef (becoming, vcertainty, 'high certainty') . 

put in action lexicon 
wdef (changed, change, change) . 
wdef (changes, change , change) . 
wdef (changing, change, change) . 
wdef (necessarily, certainty, 'high certainty') . 
wdef (necessary, vrecommend, recommended) . 
wdef (necessitate, vstatus , need) . 
wde f (nece s s i t a t e & , v s ta ir a & , nee d ) . 
wdef (necessitating, vstatus, need) . 
wdef (necessitates , vstatus , need) . 
wdef (need, vstatus , need) . 
wdef (needed, vstatus , need) . 
wdef (needing, vstatus, need) . 
wdef (needs , vstatus , need) . 
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% file ml_j?arser .pi 
:- multifile (phrase/5) . 
:- multifile (wdef/3) . 
: -unknown (_, fail) . 

% Load in program components - library components are part of Prolog 
:- ensure_loaded ( [library (basics) , library (not) , library (lists) , 

library (readin) , library (strings) , library (ctypes) , library (readconst) , 
library (date) , library (listparts) , library (sets) , 
radrec, radpardb, useful, util, tagging, lexicon, gengram] ) . 

%:- initialization run. 

%run :- on_exception (Error, processrun, stop (Error) ) . 
runtime_entry (start) :- processrun. 
runt ime_entry (abort) halt. 

% process report 

processrun :- process, halt. 

%stop (Error) :- 
% told, 

% write (user_error, 'Error : '), write (user_error, Error) , halt. 



% get user supplied parameters and process report 
process : - 

get_args (Mode, Inf ile , Outf ile , Prb, Undef s , Protocol) , 
(Examtype = [] ; % must have a domain 
process (Inf ile, Outf ile, Prb, Undef s) ) . 

% open Inf ile (text input) and process 
process (Inf ile, Outf ile , Prb, Undef s) : - 

see (Inf ile), seen, see (Inf ile), 

on_exception (Error, 

test_genome (Outf ile, Prb, Undef s) , 

app_errO (_, Outf ile, Error) ) , 
closefiles (Outf ile, Prb, Undef s) . 
process (_, Outf ile, _,_) : - 

app_err (_, Outf ile, 'Program failed') . 

app_errO (_, Output , Error) : - 

tell (Output) , 

write ( ' <error> ' ) , 

write ( ' Prolog Error occurred : * ) , 

app_err (_, Output f Error) . 
app_errl (_, Output , Error) : - 

tell (Output) , 

write ( ' <error> ' ) , 

write ( ' Error in input : ' ) , 

app_err (_, Output , Error) . 
app_err (_, Output, Error) : - 

tell (Output) , 

write (Error) , write ( 1 </error> • ) , nl . 

closefiles (Outf ile, Errf ile, Unfile) : - 
tell (Outf ile) , told, 
(Errf ile = [] ; tell (Errf ile) , told), 
(Unfile = [] ; tell (Unfile) , told). 



« -3" % 

% Argument options - get user defined arguments 

% -p ProbFile (otherwise default is problem messages are not written to file 
% -i Infile (if input is supplied by file and not standard input 
% -s Section (default is impression) 

% -m Mode (default is relax; the three choices are strict, relax, skip) 
% -o Outfile (if output should be file and not standard output) 
% -? Provide list of default arguments 

% -u Undefs (otherwise default is - undefined messages are not written 
% to a file) 

get_args (Mode, Infile, Outfile, Prbfile, Undefs , Protocol) : - 
unix (args (Args) ) , 
(Args = [] , ! , writesyntax; 
Args = ['?'],!, writesyntax; 
Args = [X | Rest] , ! , 

set_args( [x|Rest] , Mode, Infile, Outfile, Prbfile, Undefs, Protocol) ) . 

writesyntax : - 

write (user_error, 'geneparser [-m Mode] 1 ) , 
nl (user_error) , 

write (user_error, » [-t Outtype] [-p Probfile] L-u Undefs] ') , 

nl (user_error) , 

- write4user_er-ror, » - = ^[=-1- infile] [-o Outfile] V) , = . . __ 

nl (user error) . 
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% nsphrase.pl - contains words/phrases that are ignored 

nosem(both, [both] ) . 

no s em (however, [however] ) . 

nosem (selectively, [selectively] ) . 

nosem (specifically, [specifically] ) . 

nosem(the, [the] ) . 

nosem (a, [a] ) . 
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% file radpardb.pl 

% June 25, 1999 

% fail an unknown predicate 

: -unknown (_, fail ) . 
:- op<900, fy, [not,once]). % same priority and type as \+ 
: - op{700, xfx, [\=, ~=] ) . % same priority and type as = or == 

:- dynamic (sentno/1) . 
% \sem\radpardb.pl 

%parse_sentences (+Beg, -Fmt, -ParseErrors, -Undef ineds, -Unsents, +Section, 

% +UserMode, +Examtype , Sentno, Outsno, IncSno) 

% Beg is list of sentences, Fmt is list of target forms, 

% ParseErrors are a list of sentences which could not parse, 

% Undefineds is a list of undefined words in sentence 

% Unsents is a list of sentence containing undefined words 

% Section is the section of the examination, UserMode is the 

% parsing mode specified by user, 

% Examtype is the domain (type of exam) 

% Sentno is the number of the starting sentence 

% Outsno is the last sentence number + 1 

% IncSno is the amount that the sentence number should be increased 

% (i.e. it is 1 when called by parse_sects and 0 when in 

% recovery mode) — — 

% Each sentence is parsed independently. 

parse_sentences ( [] ,[],[],[],[] ,_,_,_/_/_/_> = - ! * %no more sentences 
parse_sentences (Beg, Fmtlist, Out fail , Outundef s, OutunSents , 
Section, UserMode, Examtype, IncSno) : - 
get_sentence (Beg, S, Rest) , 1 , 

( isidentif ier (S) , !, % ignore identifier sentences - parse remainder 
parse_sentences (Rest , Fmt 1 , Out fail , Outundef s , OutunSents , 
Section, UserMode, Examtype, IncSno) , ! , 
(outputform(htext) , S \= [■■'], !, IncSno \= 0, %0 means in recovery 

mode 

append( [ [ [sentence, S] ] ] , Fmtl , Fmtlist ) ; 
Fmtlist = Fmtl 

) 

% ( IncSno = 0 , ! ; % on same sentence in recovery mode 

% sentno (Sno), NewSentno is Sno + IncSno, 

% retract (sentno (_) ) , assert (sentno (NewSentno) ) 

%%) , 

% Incsno = 1, write (•***•) , write_list (S , 3 , _) , nl, !, 
% Incsno = 0, 

preprocess (S, Bs, Undef ,Semlist, strict) , % bracket and check for undefineds 

parse_modes (S , Bs , Semlist , Fmtl , Errors , Undef , Unsents , Section , Writef ail , 
Examtype, UserMode, IncSno) , % parse first sentence 

parse_sentences (Rest , Fmt2 , Moreerrors , Moreundef s , MoreUnSents , 

Section, UserMode, Examtype IncSno) , % parse remaining 
append (Errors, Moreerrors, Outf ail ) , % Combine failures 

(outputform (htext) , 

(Fmtl \= [] , IncSno \= 0, 
!, append ( [Fmtl] ,Fmt2, Fmtlist) ; % add extra bracket for 1st 
Fmt 2 = [] , Fmtlist = Fmtl , ! 
) 
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append (Fmtl, Fmt2, Fmtlist) 
) , % Combine targets 

append (Unsents, MoreUnSents , OutunSents) , % Combine sentences 
append (Undef ,Moreundefs,Outundefs) % Combine undefined words 

) . 

%parse_modes (+S, +Bs , +Semlist , -Fmt, -Failures, +Undef , -Unsents, +Section, 



% +WriteMessage, +Examtype, +Mode, +IncSno) 

% S is original sentence; Bs is sentence after lexical lookup 

% Semlist is list of semantic categories in sentence 

% Fmt is formatted output, 

% Failures is list of sentences/fragments which could not be parsed. 

% Undef are words not in lexicon, Unsents are sentences containing 
% undefined words 

% Section is name of section being processed 

% WriteMessage is message returned from doresult (in case doresult fail 

% Examtype is domain, Mode is user specified mode 

% IncSno is 0 if this is a fragment of a sentence that was already 
% parsed - but unsuccessfully; is l if this is a new sentence 



% Best possible - try to get the most accurate parse possible trying 
% all alternative strategies in -turn if neccessary ._ 
% All words in sentence are defined 

parse_modes (S,Bs, Semlist, Fmt, Errors, [] , [] , Section, no, Examtype, Pmode, 
Inc) :- 

(Pmode = bpseg, Pmodemod = mode2, !; %in recovery mode 
Pmode = bpseg2, Pmodemod = mode 2 , ! ; 
Pmode = bps eg 3 , Pmodemod = mode 2 , ! ; 

Pmode = bpskip, Pmodemod = 'mode4 , !; %in recovery mode 

% in user specified parse mode - don't parse in mode 5 or keyword 
Pmode \= keyword, Pmode \= mode 5, 
Pmodemod = model 
) , 

dosent (S , Bs , Semlist , Fmtl , Message , Section, _, Examtype, Pmodemod, _) , ! , % 
strict first 

recovery (_,S,Bs, Semlist, Fmt2, Message, Errors, [] , [], Section, 

Pmode, Examtype, _) , % try alternative modes if neccy 
( output form(htext) , Inc \= 0, !, append ([[ [sentence, S] ], Fmtl , Fmt 2] , Fmt) 
append ( Fmt 1 , Fmt 2 , Fmt ) 
) . 

% alternative strategies if have undefined words 

parse_modes (S , Bs , Semlist , Fmt , Errors , Undef , Unsents , Section, no , Examtype , 
Pmode , Inc ) : - 
Undef \= [] , 

recovery (_, S , Bs , Semlist , Fmtl , yes , Errors , Undef , Unsents , Section , 

Pmode, Examtype, _) , % try alternatives if have undef ineds 
(outputform(htext) , Inc\= 0, !, append ([ [sentence, S] ], Fmtl, Fmt) ; 
Fmt = Fmtl 
) • 

% key word strategy is fastest but least reliable-; 

parse_modes (S , Bs , Semlist , Fmt , Errors , Undef , Unsents , Section , no , Examtype , 
Pmode , Inc ) : - 
(Pmode = keyword; Pmode = mode 5 
; Pmode - mode 5) , 

recovery ( 5 , S , S , Semlist , Fmtl , yes , Errors , Undef , Unsents , Section , Pmode , 
Examtype ,_) , 

(outputform(htext) , Inc \= 0, !, append ([ [sentence, S] ], Fmtl , Fmt) ; 
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Fmtl = Fmt 
) . 

% Parsing/Recovery modes 

% parse_modes <+Level , +S, +Bs, +Sem, -Fmt , +Failed, +Undef , +Unsents , +Section, 

% +Pmode , +Examtype , _) 

% Level is the recovery level of the predicate 

% S is the original sentence list 

% Bs is the 

% Sem is the list of semantic categories in the sentence 
% Fmt is the formatted output for the sentence 

% Failed is 'yes' if the parse was unsuccessful, and 'no' otherwise 

% Undef is a list of words in sentence which are undefined (not in lexicon) 

% Unsents are the lists of sentences/segments which could not be parsed. 

% Section is the section of the report 

% Pmode is the user specified parse mode 

% Examtype is the domain 

% mode 1 is the strictest parsing mode - the parser succeeded for the complete 
% original sentence using the grammar; all words in original sentence 

% are defined in lexicon 

% mode 1 - alternative not needed because parse succeeded 

recovery (1, □ ,no, [] , Undef , Unsents , _) :- ! . 

% - no alternative strategy allowed in mode 1 

% in case where there are no undef ineds, Noparse is S 

recovery ( 1,S,_,_, [] ,yes,S, [] , [] ,_, Pmode ,_, _) :- 

Pmode - strict; Pmode = model, I. 
% in case there are undef ineds, Unsents is S 

recovery ( 1 , S , _ , [] , yes , Noparse , Undef , Unsents , _, Pmode , _, _) : - 

(Pmode = strict; Pmode = 'model'), 

Undef \= [] , Unsents = S, Noparse = [] , ! . 
recovery (1, S,_, Semlist , [] / yes, S, _,_,_,_,_,_) :- 

% sentence contains no relev. information, don't try to recover 
% \+ (subtype (finding, Semlist) ; subtype (time , Semlist )) , !. 

\+ actionchk (Semlist) . % april 23, restored 

% mode 4 - skip undefined words and try to parse according to mode 1 
recovery (4 , S , _, Fmt , yes , Errors , Undef , [ ] , Sect , Pmode , Examtype , _) : - 
Undef \= [] , 

(Pmode - bp; Pmode = mode 4 ; 

Pmode = bpseg; Pmode = bpskip; Pmode = mode4 
) , 

preprocess (S,Bs,_, Semlist , bpskip) , 

dosent (S , Bs , Semlist , Fmtl , Message, Sect ,_, Examtype , mode4 , _) , ! , 
recovery (_,Bs,Bs, Semlist, Fmt2, Message, Errors, [] , [],Sect, 

bpskip, Examtype, Sentno) , % try alternatives if neccy 
append ( Fmtl , Fmt2 , Fmt ) . 

% mode 3 - try longest parsed segment; partition rest of 
% sentence using mode 5 for parse mode bp 

recovery ( 3 , S , Bs , _, Fmt , yes , Errors , Undef , Unsents , Sect , Pmode , Examtype , _) : - 
% allowable modes for choosing longest segment 
(Pmode = bp; Pmode = bpskip; 

Pmode = skip; Pmode = mode3; Pmode = mode4; 

Pmode = bpseg3; Pmode = bpseg 
) , 

(Pmode = bpskip, Pmodemod = mode4_3 ; 
Pmodemod = mode 3 
) , 

checkst (sem_j>at tern, _,s, Target, Bs, Rest) , %check symbol table 
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%dooresult (Target, Fmtl, Examtype, Sect, Pmodemod,_) , 
formatresult (Target , Pmodemod, Fmtl) , 
(Pmode = mode3, Fmtlist = [] , Errors = Rest; 

recovery ( 5 , Rest , Rest , Fmtlist , yes , Errors , Undef , Unsents , Sect , 
Pmode , Examtype , _) 

) , 

append (Fmtl, Fmtlist, Fmt) . 
% mode 2 segments sentence using word barrier methods. This mode is tried if 
% parse failed for original sentence/or there are undefined words 

% segment sentence using word barriers 

recovery (2 , S , _, Fmt , yes , Errors , Undef , Unsents , Sect , Pmode , Examtype , _) : - 
(Pmode = bp; Pmode = bpskip; Pmode = mode2 ; Pmode = skip; 
Pmode = mode2; Pmode = mode3; Pmode = mode 4 ; 
Pmode = bpseg; Pmode = bpseg2 ; 
Pmode = bpseg3 
) , 

segmentandparse (S, Fmt, Errors, Unsents, Sect, Pmode, Examtype, _) , ! . 
% mode 5 - try to partition sentences by findings 
% when a finding in sentence is found, go left until first 
% modifier is found (if 2 findings are next to each other, 2nd one 
% is considered the finding and 1st is considered the modifier) 
-— =%— Repeat searching— for successive— findings using -this ^method 
recovery(5, [] , [] ,_, [] ,_, [] ,_/_,_,_/_/_) - ~ ! * 
recovery ( 5 , S , Bs , Fmt , yes , Errors , Undef , Unsents , Sect , 
Pmode, Exam type, _) :- 
(Pmode = bp; Pmode = bpskip; Pmode = bpseg; Pmode - keymode; 
Pmode = modeB ; Pmode = negmode 
) , 

preprocess (S,Bsl,_,_, bpskip) , % skip undefined words 

actionfindingseg (Bsl,Fseg, Before) ,! , % get segment containing finding 
(Fseg = [] , Errors = S, ! ; % no finding to segment 
%Before = [] , Errors = Bs, Fmtl =[],!; % this part was tried 
preprocess (Fseg, Bseg, _, Semlist, bpskip) , 
dosent ( Fseg , Bseg , Semi ist , Fmtl , Message , Sect , Examtype , 
modeB, _) % try to parse finding segment 

) , 

(Before = [] , Beforel = [] , Message = yes, !; % no segmenting yet - 

skip beg. 

Message = yes, Beforel = Before, I; %don't add *.*; have to skip 

more 

append (Before, [' . •] , Beforel) 
) , 

( Fseg = [] , Fmt =[],!; % no finding left in sent. - don't recover 
recoverrest (Fseg, Beforel , Fmt2 , Message , Errors , 
Sect, Newmode, Examtype ,_) , 

% recover remainder 

append ( Fmtl , Fmt 2 , Fmt ) 
) . 

% nothing could be recovered; all input -> Errors ; Format is [] 
recovery (__, Sents,_,_, [] , yes , Sents, Undef , [] ,_/_,_/_) • 

% part of phrase was skipped, add period and treated skipped part as a 
% sentence 

% recoverrest (+Segment , +Semlist , +Before, -Fmt, -i-Message, -Failures , +Section, 
% +Mode , +Exam t ype ; _ ) 

% Segment is part of sentence with a finding 
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% Semlist is a list of semantic categories for that sentence part 

% Before is the part of sentence before Segment 

% Fmt is the format for this segment 

% Message is 'no' if there is no segmantic information to be recovered 
% Message is 'yes' otherwise 

% Failures are lists of segment (s) that could not be parsed successfully 

% Section is section being processed, Mode is user specified parsing mode 

% Examtype is domain 



recoverrest (_,_/ Before, [] , no, Beforel ,_,_»_, _) =- 

(Before = [] , Beforel =[],!; % nothing was skipped 
append (Before, [» . •] , Beforel) 
), !. 

% nothing left to recover; write phrase that was skipped 
recoverrest ( [] ,_, Before, [] , yes, Beforel, _,_,_,_) :- 

(Before = [] , Beforel = [] , !; 

append (Before, [' . '] , Beforel) 

>, !• 

% can recover partial parse 

recoverrest (Bs, _, Before, Fmt , yes, Errors, Sect, Pmode, Examtype, _) : - 

checkst (semjjat tern, _,s, Target, Bs, Rest seg) , % recover from symbol tab. 
%doresult (Target , Fmtl , Examtype , Sect , modes , _) , 
. formatresult (Target, mode5, Fmtl) , .. 

recovery ( 5 , Rest seg , Rest , _ , Fmt 2 , yes , Error2 , 

[] , [] , Sect, Pmode, Examtype, _) , 
append (Fmtl, Fmt 2, Fmt) , 

(Before = [] , Errors = Error2 , !; %nothing skipped to add ' . ' to 
append (Before, [' . • |Error2] , Errors) 
) . 

% cannot recover partial parse - skip first element and retry 
% if 1st element is a negation semantic type, skip 2nd element instead 
% Handles case where 1st element is a negation, certainty or status 

% add 2nd element to unparsed sentences list (enlcosed in angle brackets) . 

recoverrest ( [X , Y | Restseg] , _, Beforel , Fmt , yes , Errors , 

Sect , Pmode , Examtype , _) : - 
foundword(X, Semi, Tar) , 

( member(Seml, [neg, certainty , vcertainty, vconn, status , vstatus] ) ; 
Semi = p, Tar = [_, conn] 

>, 

%(Mod = neg; Mod = certainty; Mod = status; Mod = vcertainty), % leave 
this mod in 

preprocess ( [X | Restseg] , FsegO bpskip) , % skip undefined words 
findingseg(FsegO,Fseg,Before2) , !, % get finding seg 
(Fseg = [] , Errors = [X, Y| Restseg] , Fmt = [] ; % no finding 
preprocess (Fseg, Bseg,_, Restsem, bpskip) , % skip undefined words 
dosent ( Fseg , Bseg , Restsem , Fmt 1 , Mes sage , Sect , _ , Examtype , 

modes, _) , % try to parse finding segment 
recoverrest (Fseg, [Y|Before2] , Fmt2 , Message, Error2 , 

Sect, negmode, Examtype, _) , % recover remainder 
(Beforel = [] , Errors = Error2, !; 
append (Beforel, [. |Error2] , Errors) 
) , 

append (Fmtl , Fmt 2 , Fmt) 
) . 

% skip 1st element; enclose it in brackets 
recoverrest ( [X | Restseg] , Beforel , Fmt , yes , Errors , 
Sect , Pmode , Examtype , _) : - 
preprocess (Restseg, FsegO, bpskip) , 
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findirigseg(FsegO,Fseg / Before2) , !, % get finding seg 
append (Bef orel, [X|Before2] , Before) , 

(Fseg = [] , Errors = [X|Restseg], Fmt = [] ; % no finding 
preprocess (Fseg, Bseg, _, Restsem, bpskip) , 
dosent (Fseg,Bseg, Restsem, Fmtl, Message, Sect, _,Examtype, 

modeS, _), % try to parse finding segment 
recoverres t ( Fseg , _ , Before , Fmt 2 , Message , Errors , 

Sect,Newmode, Examtype,_) , % recover remainder 
append ( Fmt 1 , Fmt 2 , Fmt ) 
) . 

% no semantic information left; return Errors 
recoverrest ( [X|Restseg] , [] , Beforel, Fmt ,yes, [x|Restseg], 
Sect,Pmode,Examtype,_) . 

%dosent (+S, +Bs, +Semlist , -Fmtlist , +Message, +Section, +WriteMessage , +Examtype, 
% +Mode) 

% S is original list of words in sentence; Bs is list after lexical lookup 

% Semlist is list of semantic categories corresponding to Bs 

% Fmtlist is list of target forms for sentence 

% Message is 'yes* if the output from parser signals a failure, 

% and -'no 1 - otherwise . -_, 

% Section is section of examination being processed 

% WriteMessage signals whether an error occurred in generating target form 

% Examtype is the domain, and Mode is the user specified mode of parsing 

% Parse sentence and returns target in nested format 

% Handles case where sentence should be skipped because info is about 
% family member or peripheral to patient 
dosent (S,_, Semlist, [] # Error _) : - 

skipsentence (S, Semlist , Error) , ! . 
dosent (S , Bs , Semlist , Fmtlist , Errormsg , Sect ion, Writef ail , Examtype , Mode , _) : - 
attemptparse ( P , Bs , sentence , Semi ist , Section , Atotal ) , 

( P = [failure] , Errormsg = yes, Writef ail = no, ! % parse failure 

P = [] , Errormsg = no, Writefail = no, Fmtlist = [] , ! % empty target 

%doresult (P , Fmtlist , Examtype , Section, Mode , _) , 
formatresult (P, Mode, Fmtlist) , 
Errormsg = no, Writefail = no, ! 

Errormsg = yes, Writefail = yes, 1 

) . 

%parse_sentences (Beg, Beg, [] , □,_#_,_) *- — 

% attemptparse (-P, +Bs, +Structure, +Semlist, -Ftype, -Total) 



% P is output from parser 

% Bs is list of words in sentence after lexical lookup 

% Structure is name of structure to be parsed 

% Semlist is list of semantic categories corresponding to elements in Bs 

% Total is number of times parser reached sem_sent in grammar; 

% where sem_sent is highest level predicate in grammar 

% don't parse if sentence consists of only '.' or ! ;' 
attemptparse ( [] ,Bs, _,_,_,_) : - 
Bs = ['.»]; Bs = [';']. 



% if a template exists for whole sentence, get parse from it 



attemptparse (P,Bs, sentence^, _,_) : - 

Bs = [X,'.'], is_list(X), % the whole sentence is a finding 
f ind_sem_sent (P, X) , ! . 

% parses and retracts wellformed string table - parses sentence 
attemptparse (P,Bs, sentence, Semi ist, Ftype, Atotal) : - 

ret rac tall (wf st (_,_,_, _,_/_) ) , 

retractall (addstotal (_) ) , 

sem_sent (P, Semlist, Atotal, Bs, t] ) , ! - 

% parses and retracts wellformed string table - parses bodypart only 
attemptparse (P, Bs , bodypart , _,_,_) : - 

sem_bodyloc (P,Bs, [] ) , 

retractall (wf st (_/_,_/_#_#_))/ I * 

%segmentandparse ( +Sentences , - Fmtlist , - Failures , -Unsent , +Sect ion, +Mode , 



% +Examtype , +Sentno) 

% Sentences is list of sentence segments. 

% Fmtlist consists of the formatted output for the segments 

% Failures is the list of unparsed segments. 

% Unsent is the list of segments with undefined words. 

% Section is the section being processed, Mode is the user specified mode 

% Examtype is the domain and Sentno is the sentence id. 



segment andparse ([],[],[],□,_,_,_,_) : - ! • 

segmentandparse (Sentences, Fmtlist , Failures, UnSent, Section, Mode, 
Examtype , Sentno) : - 
get_sentence (Sentences, S, Rest) , !, %sentence to segment 
preprocess(S,Sl,_,Semlist,Mode) , ! , 
(Mode = mode2, NewPmode = bpseg2 , !; 
Mode = mode3, NewPmode = bpseg3, ! ; 
NewPmode = bps eg 
>, 

( segmentl (SI, Segs, [] , seg) , !, 

parse_sentences ( Segs , Fmt 1 , Fails , _, Unl , Section, NewPmode , Examtype , 
Sentno , Sentno , 0 ) , ! 
; segment2 (SI, Segs, [] , seg) , !, 

parse_sentences (Segs , Fmtl , Fails Unl , Section, NewPmode , Examtype , 
Sentno , Sentno , 0 ) , ! 
; segment 3 (SI, Segs, [] , Negstatus , seg) , !, 

parse_sentences ( Segs , Fmtl , Fails , _, Unl , Section , NewPmode , Examtype , 

Sentno, Sentno, 0) , ! 

) , 

% fails if cannot segment sentence; otherwise segments remainder 
segmentandparse (Rest , Fmt2 , Nexterrors , NextUns , Section , Mode , 

Examtype, Sentno) , 
append (Fmtl, Fmt2, Fmtlist) , 
append (Unl , NextUns , UnSent ) , 
append (Fails , Nexterrors , Failures) , ! . 

%segmentl (+S, -Segs, +Beg, +Message) 



% S is list of words in sentence 

% Segs consists of sentence segments as separate sentences 

% Beg is list of words in sentence prior to the current portion of sentenc 

% Message is 'seg' if segmenting succeeded and 'noseg' otherwise 



segmentl ([],[] ,_,noseg) :- !. 

% segment sentence at connect phrase/word or at most conjunctions 
% if negation precedes, restore negation 
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segmentl { [X | Rest] , [ » . ■ , ' <eos> ' | Rem] , Beg, seg) : - 

\+ sem_endmark(Rest / [] ) , % don't segment if at end already 
foundword(X, Sem, Target ) , % get semantic classification and target 
( X = nor, append { [no] , Rest, Rem) % ok to segment at nor 

;X = without, append ( [no] , Rest, Rem) % ok to segment at without 

%;X = ' : ' , Rest = Rem 

; Sem = neg, Rest = [Next | Rest2] , % have negation; test word after 
foundword(Next, Sem2 , Target2) , % for connective - add back negation 
testforconn(Next,Sem2,Target2) , Rem = [X|Rest2] 
; testforconn(X, Sem, Target) , Rest = Rem 
) . 

segmentl ( [X | Rest] , [X | Newrest] , Start , Seg) :- 

append (Start, [X] , Beg) , % part before segmentation 
segmentl (Rest , Newrest, Beg, Seg) . 

testforconn (X, Sem, Target) : - 

{ Sem = p, Target = [P,conn],P\= with % segment at connective prep 
; member (Sem, [vconn, vshow] ) % segment at these types of verbs 
; Sem = conj, \+ member (X, [and, or, ' , ' , '/' /^s] ) 
) . 

% segment at certain words ----- • 
segment2 ([],[],[] ,noseg) :- ! . 

segment2 (S, Segs, [] , seg) : - 
seg2 (S,Rest, Segs) , 
\+ sem_endmark (Rest , [] ) , ! . 
segment2 ( [X | Rest] , [X | Newrest] , [] , Seg) : - 

segment2 (Rest, Newrest, [] ,Seg) . 
seg2 ( [X | Rest] ,Rest, [■ . ' , '<eos>' |Rem] ) :- 

member (X, [which, that , until , where , when , while , who , 
1 (', ') ', between, whereby, after, before, prior, 
greater, ranging] ) , 
Rem = Rest, ! . 

segment3 ([],[] ,_,_,noseg) :- !. 

% segment at conjunction - if negation preceded conjunction, add 
segment3 ( [x|Rest] , Rem, Beg, Negstatus , seg) :- 

\+ sem_endmark(Rest, [] ) , !, % already at end of sentence 
seg3 ( [X | Rest] , Rem, Beg, Negstatus , seg) , ! . 

seg3 ( [X | Rest] , Rem, Beg, Negstatus , seg) : - 
wdef (X, conj ,_) , 
member (X, [and, or, ',']), 

(nonvar (Negstatus) , Rem = [».', Negstatus | Rest] , ! %restore negation 

; Rem = [*.',' <eos> ' | Rest] , ! 
) . 

seg3( [X | Rest] , [X, ' . ■ , '<eos>' |Rest] ,_,_,seg) :- 
f oundword(X, age) , ! . 

seg3 ( [X | Rest] , [X [Newrest] , Start, Negstatus, Seg) 

( nonvar (Negstatus) , !; % 1st neg already found - continue segmenting 
f oundword (X, Sem, Target) , ! , 

( Target = no, Negstatus = X, ! ; 
Sem = neg, Negstatus = X, ! ; 
Sem \= neg, Target \= no, ! 

) ; 



no 

true, ! % word is undefined 
) , 

append ( Start , [X] , Beg) , % part before segmentation 
segment 3 (Rest, Newrest, Beg, Negstatus, Seg) , ! . 

% for finding type classes - parse as a sentence 
whattoparse (Sem, P, Sent) 

member (Sem, [cfinding,pf inding, morph, disease, device, proc,mproc, descriptor] ) , 
attemptparse (P, Sent, sentence, [Sem] , impression, _) . 

% for bodyloc classes - parse as a bodyloc modifier 
whattoparse (Sem, P, Sent) : - 

member (Sem, [bodyloc, region, side, position] ) , 

attemptparse (P, Sent , bodypart _) . 
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% file radrec.pl 
% September 7, 1999 
% fail an unknown predicate 
: -unknown (_, fail) . 

op(900, fy, [\+, not, once] ) . % same priority and type as \+ 

op(700, xfx, [\=,~=]). % same priority and type as = or == 

dynamic (domain/ 1) . % domain being processed 

dynamic (output form/1 ) . % form of output (needed to distinguish 

% markup of text from formatting forms 
:- dynamic (currentsect/1) . % section for outputting results 

test_genome (Outf ile, Errfile, Unfile) : - 

get_inputsents ( [] , Toklist) , !, % read in and tokenize input 
(Toklist = [],!, % error condition 
app_errl (_, Outf ile, 1 No input sent 1 ), 1 

parse_sentences (Toklist , Fmtlist , Failed, Undef , UnSent , impression, 
bp, genome, 0) , ! , 

outputresults (Fmtlist, Failed, Errfile, Undef, Unfile, UnSent, Outf ile, 
full, line, genome, 1, G,_, exe, plain) 

) . 

outputresults (FmtlistO , Failed, Errfile , Undef , Unfile , UnSent , Out file , 

Amount , Type, Exam, Compno, Doc Comp, NewCompno, Caller , Protocol) 
tell (Outf ile) , 

(Protocol = sgml, ! , Op = sgml; 
Caller = server, ! , Op = sgml; 
Op = plain) , 

(Type = nested, ! , % original output form - nested findings 
write ( ■ <nested> • ) , new_line (Op) , 
write (Fmtlist) , new_line (Op) , write ( ' </nested> 1 ) , 
new_line (Op) , ! 

) , 

(Caller = server, 

write_message (Unfile, Undef , Caller, ' < undef ined> ' , 1 < /undef ined> 1 ) 
Caller = exe, Undef \= [] , 

write_message (Unfile, Undef , Caller, 1 ***** Undefined Words *****',[]) 
%write_highlight ( [] , UnSent , Caller) 

true 
) , 

(Caller = server, 
write ( ' <noparse> ' ) , ! , 
write_highlight (Undef , UnSent , Caller) , 

writejiighlight ( [] , Failed, Caller) , write (* </noparse> ' ) 

Caller = exe, Errfile \= [] , Failed \= [] , 
tell (Errfile) , 

write ('***** Sentences/Phrases Not Parsed **+**'), nl, 
%write_highlight (Undef , UnSent, Caller) , 
write_highlight ( [] , Failed, Caller) 

true % no Errfile to write to 
) . 

% set_args : Process options 



% Argument options 

% -p ProbFile (otherwise default is problem messages are not written to file) 

% -i Infile (if input is supplied by file and not standard input 

% -m Mode (default is bp; the 6 choices are bp, model - modeS) 

% -o Outfile (if output should be file and not standard output) 

% -? Provide list of default arguments 

% -pr Protocol - sgml or plain (default is plain) 

% -u Undefs (otherwise default is - undefined messages are not written 
% to a file) 

set_args ( Args , Mode , Infile , Outfile , Prbf ile , Undef , Protocol ) : - 
set_mode (Args, Mode) , set_amount (Args, Amount) , 
set_protocol (Args , Protocol) , 

set_inf ile (Args, Infile) , set_outf ile (Args , Outfile) , 
set_prbf ile (Args, Prbf ile) , set_undefs (Args , Undef ) . 



set_mode (Args , Mode ) : - 

(nextto( ' -m 1 ,M,Args) ; nextto (m, M, Args) ) , ! , 

modeis (M, Mode) , 1 . 
set mode(_,bp). % default output type 



n 



modeis (relax, mode2 ) :- ! 

modeis (strict j model ) : - 
i~3 modeis (skip, mode4) :- !. 

modeis (longest , mode3) :- 
|f| modeis (best , bp) :- !. 
a ";^ modeis (model , model) 
, modeis (mode2 , mode2 ) 
^ modeis (mode 3 , mode 3 ) 

modeis (mode4 , mode4 ) 
j/; modeis (modes , mode 5) 

s set_protocol (Args , Protocol ) : - 

□ (nextto ( * -pr ■ , Protocol , Args ) ; nextto ( ' pr ' , Protocol , Args ) ) , 

-11 member (Protocol, [sgml, plain] ) , ! . 

j: : b set_protocol (_, plain) . 
J;: set_undefs (Args, Undefs) :- 

nextto ( 1 -u r , Undefs, Args) ; nextto (u, Undef s , Args) , !. % undef file option 
set_undef s (_, [] ) . % default is no file of undef ineds created 

set_inf ile (Args , Infile) :- 

nonvar (Infile) , !; % Infile is set already 
nextto ( * -i ' , Infile, Args) , ! ; 
nextto (i, Infile, Args) , ! . 
set_inf ile (_, user_input) . % default is standard input 

set_prbf ile (Args, Prbf ile) :- 

nextto C-p' , Prbf ile, Args) , i ; nextto (p, Prbf ile, Args) , ». % prob file option 
set_prbfile(_, [] ) . % default is no file of problems is created 

set_outf ile (Args , Outfile) 

nonvar (Outfile) , ! ; % Outfile is already set 

nextto (' -o' , Outfile, Args) , !; nextto (o, Outfile, Args) , !. % outfile option 
set_outfile(_,user_output) . % default is standard output 

new_line (sgml) :- write (• <br> 1 ) , nl, !. 
new_line (server) :- write ( 1 <br> '). nl , !. 
new line(exe) :- nl . 
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new_line (plain) : - nl . 
write_message (_,[], exe,_,_) :- !. 
write_message ([],_, exe,_,__) :- !. 
write_message (_, [] ,plain,_,_) :- ! . 
write_message ( [] plain, _) : - ! . 

write_message (File, Contents, Caller, Begmsg, Endmsg) : - 
( member (Caller, [exe, plain] ) , tell(File), ! 

true) , 

write (Begmsg) , new_line (Caller) , 

(Contents = [] ; write_list (Contents , 1) , new_line (Caller) 
), 

(Endmsg = [] , ! ; 

write (Endmsg) , ! , new_line (Caller) 
) . 

sentend( [X|_] , Caller) :- 

member (X, [ » . ' , * ; • , ' ? ' ] ) , new line (Caller) , ! . 



gettargetsf [],[]) :- ! . 

gettargets ( [ignore | Rest] , [ignore | Rest] ) :-]..% possibly ignore info. 

□ gettargets ( [Wl | Rest] , [Tl|Trest]) :- 

*3 foundword(Wl,_,Tl) , % target for Wl 

Li! gettargets (Rest , Trest ) , ! . 

n« gettargets (W,W) . % not in lexicon 
isneg(X) :- 

intersect (X, [no, negative , deny, 'rule out'] ) . 

writeoutsent ( [Word] Rest] ) : - 

write ( ' ' ' ' ) , write (Word) , write ( ' ' ■ ' ) , ! , 
2 (Word = ' ' ' ' , write ( ' » ' • ) , ! ; true) , 

□ (Rest \= [] , write (»,'), ! , writeoutsent (Rest) , ! ; 

B « true) , ! . 

i . 

u 



% This file contains predicates associated with SGML tags 
% nextTag (+L,Tag, -PreTag, -PostTag) is true if 
% L is the starting List 

% Tag is an SGML tag; it could be a variable or instantiated already 

% PreTag is portion of L preceding Tag 

% PostTag is portion of L following Tag 

nextTag (L, Tag, PreTag, PostTag) : - 

append (PreTag, [ '< ' ,Tag, ' >' | PostTag] ,L) . 

% endTag (+L, +Tag, -Pre, -Post) is true if 
% L is the starting list 

% Tag is the SGML end tag 

% Pre is the portion of L preceding the end of tag 

% Post is the portion of L following the end of tag 

endTag (L, Tag, Pre, Post) : - 

append ( [Pre, [•<• , '/' ,Tag, '>»] ,Post] ,L) . 

% enclosedPart <+L, +Tag, -Enclosed) is true if 

% L is the starting List; it is assumed that L is portion of some 

% list that follows a begin tag - i.e. 1 <',Tagj'L 

% Tag is the SGML tag 

% Enclosed is the portion of text enclosed in tag; not including 

% end tag. 

enclosedPart (L, Tag, Enclosed, Post) : - 
endTag (L, Tag, Enclosed, Post) . 
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% file useful.pl - lexical lookup and utility tools 

: -unknown (_, fail) . 

: -dynamic (sentence/1) . 

:- op(900, fy, [not, once]) . % same priority and type as \+ 

:- op(700, xfx, [\=,~=]). % same priority and type as = or == 

% useful.pl February 21, 1992 

% 

% preprocess (+S,+Bsl, -U, -Sem3,+Mode) : preprocesses sentence to 

% bracket lexical phrases and remove words/phrases in 

% special db of noise words (nosem in nsphrase.pl db) 

% S is original sentence 

% Bsl is preprocessed sentence 

% U is list of undefined words in sentence 

% Mode is mode of process - in skip mode undefined words are removed 

% from preprocessed sentence 

preprocess (SO, Bsl, U, Sem3,Mode) : - %cfnew 

checkbeg(SO,S) , % if beginning is 1 A) ' ignore 

checkphrase(S,Sl,Seml) , % bracket all phrases in phrasal lexicon first 
checklist (SI, Ul / Bs,Sem2, Mode) , % check that all words are in lexicon, remove 
non semantic 

checklist (Bs,U, Bsl, Sem3, Mode) . % check for phrases after non-sem are removed 
%append (Semi, Sem2, Semi) , -= - 

%append (Semi , Sem3 , Semlist) , 

%union (Ul , U2 , U) . 

% found checks if word X is defined as a single word, or if X starts a defined 
% phrase 
foundword(X) :- 

wdef(X,_,_), !. 
foundword(X) :- 

semw (X, _,_,_) , ! . 
%definition from tagged input 
foundword(X) :- 

phr(X,_,_,_) , !. 
f oundword ( [X | Rest] ) : - 
Rest \= [] , 
phrasal (X,_, [X|Rest] ,_) , ! . 
% 3/99 added f oundword to search the new semact.pl lexicon 
% phrasal using semp was added to util.lp 
% found/2 returns semantic cat. of word 
f oundword (X , Sem) : - 
wdef (X, Sem,_) . 
f oundword (X , Sem) : - 

semw (X, Sem, _,_) . 
%definition from tagged input 
f oundword (X , Sem) : - 

phr (X, Sem, [],_). 
f oundword ( [X | Rest] , Sem) : - 

phrasal (X, Sem, [X | Rest] , _) . 
% found/3 returns semantic cat. and target form 
f oundword (X , Sem , Form) : - 

wdef (X, Sem, Form) . 
f oundword (X , Sem , Form) : - 

semw (X, Sem, Form, _) . 
%definition from tagged input 
f oundword (X, Sem, Form, _) : - 

phr (X, Sem, [] , Form) . 
f oundword ( [X | Rest] , Sem, Form) : - 



phrasal (X, Sem, [X|Rest] , Form) . 

%collectsem (4-Word, -Sem) : Sem is the list of semantic classes corresponding 
% to Word 

collectsem (Word, Sem) :- 

setof (X, foundword(Word,X) ,Sem) . 
% missing checks if a word present in a sentence is defined 
missing (X) :- 

member (X, S) , 

not foundword(X) . 

% checkbeg (+S0, -S) checks beginning of sentence; if it begins with a letter or 
% number followed by a ' ) ' , that part is skipped 
checkbeg ( [X, ')' |Rest] , Rest) :- !. 
checkbeg (X,X) . 

% checks every word in a list to see if it is defined; creates 
% a new list of words not defined, and a new list of sentence 
% where phrases are bracketed, 
checklist ( [] ,[],[],[],_). 

% if X is a list it has already been identified as a phrase in phx<4-»al lex 
checklist ( [X | Rest] , Undef, Ne wrest , Semi is t, Mode) : - 
— - ■ is_list (X) , - — • - • - 

J J check_no_sem ( [X | Rest] , Restl , _) , 

'%3 checklist (Restl, Undef , Newrest , Semlist , Mode) , !. %is phrase part of nosem 

Iff checklist ( [X|Rest] , Undef, [X| Newrest] , Semlist , Mode) :- 

%collectsem (X, Sem) , 
□ is_list(X), X= [Wl|Tail], 

^1 phrasal (Wl,Sem,X,_) , 

aj'l checklist (Rest, Undef , Newrest, Sem2, Mode) , !, 

y 1 ]. append ( [Sem] , Sem2 , Semlist) . 

checklist ( [without | Rest] , Undef , Newrest , Semlist , Mode) :- 
* checklist ( [with, no | Rest] , Undef , Newrest , Semlist , Mode) . 

i=l % this problem has to be fixed in preprocessor 

% check for a number with a ' , ' - "11,200" and fix it 
U %checklist ( [X, ' , ' ,Y|Rest] , Undef , [N|Newrest] , [number | Semlist] ,Mode) :- 
[™ % number (X), number (Y) , N is X * 1000 + Y, !, 
p % checklist (Rest, Undef, Newrest, Semlist, Mode) , ! . 
til % check for a literal number %cfnew 

checklist ( [X|Rest] , Undef, [x| Newrest] , [number | Semlist] ,Mode) :- 
number (X) , 

checklist (Rest , Undef, Newrest, Semlist, Mode) , ! . 
% beginning of List is a prefix of a phrase that is a complete finding 
checklist (List, Undef , [Phrase | Newrest] , [cfinding | Semlist] ,Mode) :- 

check_sem_f inding (List , Rest , Phrase) , 

checklist (Rest , Undef, Newrest, Semlist , Mode) , ! . 
% beginning of List is a prefix of a phrase that is in nosemantic lexicon 
checklist (List , Undef , Newrest , Semlist , Mode) : - 

check_no_sem (List, Rest, Phrase) , 

checklist (Rest, Undef , Newrest, Semlist, Mode) , 1 . 
% beginning of List is a prefix of a phrase that is in phrasal lexicon 
checklist (List , Undef , [Phrase | Newrest] , Semlist , Mode) :- 

get_longest_sem (List , Rest , Phrase , Sem) , 

%check_sem(List, Rest, Phrase, Sem) , %change to get longest phrase 

checklist (Rest, Undef , Newrest, Sem2, Mode) , !, 

append (Sem, Sem2 , Semlist) . 
% beginning of List is a single word that is in semantic lexicon 
checklist ( [X|Rest] , Undef, [X | Newrest] , Semlist , Mode) :- 
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collectsem(X, Sem) , ! , 
%foundword(X / Sem) , ! , 

checklist (Rest , Undef ,Newrest, Sem2 ,Mode) , !, 
append (Sem, Sem2 , Semlist) . 
% beginning of List is an undefined word 
checklist ( [X|Rest] , Undef s, Nrest, Semlist , Mode) : - 
checklist (Rest , Undef ,Newrest , Semlist, Mode) , 
(member (X, Undef ) , !; Undefs = [x| Undef], I ) , 
(Mode = skip, !, Nrest = Newrest; 
Mode = bpskip, !, Nrest = Newrest; 
Nrest = [X | Newrest] ) , ! . 

% if beginning is a number followed by a . followed by a non number 
% skip; %cfnew 

checkphrase ( [X, . ] , [X, . ] , [] ) : - ! . 
checkphrase ( [X, . , Z |Rest] , Y, Semlist) : - 

number(X), not (number (Z) ) , checkphrase (Rest , Y, Semlist) , ». 
% beginning of List is a prefix of a phrase that is a complete finding 
% or a phrase in phrasal lexicon 
checkphrase (List , [Phrase [Newrest] , Semlist) :- 

(check_sem_f inding (List , Rest, Phrase) , Sem = [cf inding] ; 

get_longest_sem (List , Rest, Phrase, Sem) . . _ . 

), !, 

%check_sem (List , Rest , Phrase , Sem) ) , ! , 

checkphrase (Rest , Newrest , Sem2 ) , ! , 

append (Sem, Sem2 , Semlist) . 
checkphrase ( [W|Rest] , [W [Newrest] , Semlist) :- 

checkphrase (Rest , Newrest , Semlist) . 
checkphrase ( [],[],[]). 

check_sem_f inding ( [W|Tail] ,Tail,W) :- 

W = [Wl|Rest], % W is bracketed already 

sem_f inding_sent (Wl, W,_) . 
check_sem_f inding ( [W | Tail] , Sf inal , Phrase) : - 

sem_f inding_sent (W, Phrase,_) , 

begsublist (Phrase, [w|Tail] ,Sfinal) , ! . 
sem_f inding_sent (_, _,_) :- fail. 

% check_no_sem(+Sent, -Rest, -Phrase) : removes Phrase from Sent resulting 
% in Rest if Sent begins with a phrase in nosem (non-semantic list) . 
check_no_sem( [w|Tail] , Sf inal , Phrase) :- 

nosem (W, Phrase) , %phrase beg. with W that should be removed 

begsublist (Phrase, [w|Tail] ,S1) , 

remove_comma (SI, Sf inal) , !. % remove if it is next 

%get_longest_sem(+Sent, -Rest, -Phrase, -Sem) : Phrase is longest phrase that is 
% a prefix of Sent; Rest is remainder and Sem is list of semantic classes 
get_longest_sem( Sent, Rest, Phrase, [Sem]) :- 

setof (X,check_sem(Sent,X) ,L) , % set of Phrases 
maxphrase(L, [], Phrase , 0) , % Phrase with maximum length 

append (Phrase, Rest, Sent) , % rest of sentence after Phrase 

f oundword ( Phrase , Sem) . 

% check_sem(+Sent, -Rest, -Phrase, -Sem) : checks if phrase beginning with 

% Sent is in phrasal lexicon; Rest is the remainder of Sent after phrase 

% Sem is the semantic class 

check_sem ( [W | Tail] , Rest , Phrase , Sem) : - 

phrasal (w. Sem, Phrase, _) , 

begsublist (Phrase, [W|Tail] ,Rest) . 



% this also obtains the Target form 

check_sem( [w|Tail] , Rest , Phrase , Sem, Target) : - 

phrasal (W, Sem, Phrase, Target) , 

begsubl is t (Phrase, [W|Tail] , Rest) . 
check_sem{ [w|Tail] , Tail, W, Sem) : - 

is_list (W) , %enclosed in brackets means it is a phrase 

W = [Wl | Rest] , 

phrasal (Wl, Sem, W,_J , t . 
check_sem( [W|Tail] , Tail , W, Sem, Target ) :- 

is_list (W) , %enclosed in brackets means it is a phrase 

W = [Wl | Rest] , 

phrasal (Wl, Sem, W, Target) , ! . 
% check_sem(+Sentence, -Phrase) is similar to check_sem/4 except for fewer args 
check_sem (Sentence, Phrase) :- 

check_sem ( Sent ence,_, Phrase, _) . 



% file util.pl 

%%%%%%%%%%%%%%%% Utility Predicates %%%%%%%%%%% 

% fail an unknown predicate 
: -unknown (_, fail) . 
:- op (900, fy, [not, once]). 
:- op(700, xfx, [\=,~ = ] ) . 

:- dynamic (wfst/6 ) . 
:- dynamic (addstotal/1) . 
:- dynamic (paragno/l) . 
:- dynamic (sectno/l) . 
:- dynamic (phr/4) . 

% wfst (+Rule,+Nuniber,+Res,+Fmt,+SO,+S) : well-formed symbol table 



% Rule is the name of rule; Number is the option number 

% Res is s for success and f for failure 

% Fmt is the format (for successes); for failure Fmt is [] 

% SO is the sentence position at the start of Rule 

% S is the sentence position when Rule has been completed 

% add to wfst 



addst (Rule, Number, Res, Fmt , SO, S) : - 

\+ checkst (Rule, Number, Res, Fmt, SO, S) , %result for rule was saved already 
\+ checkst (Rule, Number, i, Fmt, SO, S) , % result from different rule saved 
( checkst (Rule,_, Res, Fmt, SO, S) , % different rule produced same result 

assert (wfst (Rule , Number , i, Fmt, SO, S) ) ; 
assert (wfst (Rule, Number , Res , Fmt , SO , S) ) ) , ! . 
addst (_,_,_,_,_,_): - !. % always succeed 

% checkst (+Rule, -Number, -Res, -Fmt, +S0, -S) : checks to see if rule has been saved 
% in wfst 

checkst (Rule, Number , Res , Fmt , SO , S) : - 
wfst (Rule, Number, Res, Fmt , SO, S) . 

% beglist(L,Y) - is Y the head of list L 
beglist{ [X|_] ,Y) :- X = Y , ! . 

% splice (+L1, -L2) : LI is a list of lists; L2 is merged list 
splice (LI , L2) :- append (LI , L2 ) , !. 
%splice( [] , [] ) :- ! . 
%splice ([[]], []) :- !. 
%splice( [X] ,X) :- !. 

%splice( [ [] | LI] ,L2) :- splice (LI, L2) ,! . 

%splice( [ [ [] ] | LI] ,L2) splice (LI , L2 ),! . 

%splice ( [X | [[]]], L) : - splice (X, L) , ! . 

%splice ( [L1,L2] ,L3) : - 

% append ( LI, L2,L3) , ! . 

%splice( [X|L1] ,L2) :- 

% splice(Ll,L3) , 

% appendix, L3,L2) , ! . 

%splicerel - works with relations which have Argl, . . .,Argn. 
% It splices a Splicelist in each arg of relation 

splicerel (Finding, Splicelist, Spliced) : - 
splice (Splicelist , Spl) , 

(Finding = [rel , X \ Rest] , spliceargs (Rest , Spl, Sp) , 
%splice ( [ [rel , X]' , Sp] , Spliced) , ! ; 



% same priority and type as \+ 
% same priority and type as = or == 



append ( [rel, X] , Sp, Spliced) , ! ; 

%splice ( [Finding, Spl] , Spliced) ) . 

append (Finding, Spl # Spliced) ). 
%spliceargs - Splices a list' into each element of a list 
spliceargs ([],_,[]) : - ! . 

spliceargs ( [Argl | Rest] , Splicelist , Spliced) :- 

%splice ( [Argl, Splicelist] , Sargl) , 

append (Argl, Splicelist, Sargl) , 

spliceargs (Rest, Splicelist, Srest) , 

%splice ( [ [Sargl] , Srest] , Spliced) . 

append ( [Sargl] , Srest , Spliced) . 
list([], []) . 
list( [x| []] ,X) . 

list ( [X|L1] ,L2) :- list (LI , L3 ) , 

append ( [X] ,L3,L2) , ! . 

% strip (LI, L2) removes extra square brackets from L 
strip ( [L] ,L) . 

% B is a suffix of A and C is the difference 
dif f list (A, B, C) :- append (C,B, A) . 

% S is a sublist at beg. of L if there is a list Rest, which when appended 
% to S results in L. 

begsublist (S, L, Rest) :- append (S, Rest , L) , !. 

% checks that first element in list S has semantic category in Semlist 
firstword( [Wl|_] , Semlist) :- 

atom(Wl) , wdef (Wl, Sem,_) , % semantic category 

member (S em, Semlist ) . 
f irstword( [Wl |_] , Semlist) : - 

is_list (Wl) , phrasal (Wl, Sem,_,_) , 

member (Sem, Semlist ) . 
% removes phrases from first arg that are in nsphrase - lexicon of non-sem. 
phrases 

remove_no_sem( [],[]):-!. 
remove_no_sem ( [w|Tail] ,Sfinal) :- 

nosem(W, Phrase) , %phrase beg. with W 

begsublist (Phrase, [W | Tail] , SI) , %remove from sentence 

remove_comma (SI, S2) , % remove , if it is next 

remove_no_sem (S2 , Sf inal) , !. 
remove_no_sem ( [ W | Tai 1 ] , S f inal ) : - 

remove_no_sem (Tail , SI) , 

append ( [W] , SI, S final) , !. 
remove_comma ( [ ' , ' | Tail] , Tail) . 
remove_comma ( S , S ) . 

% remove_sem(+Sent, -NewSent) : Sent is the original sentence, NewSent is 
% stripped of all phrases that are defined in lexicon 
remove_sem( [],[]) : - ! . 
remove_sem ( S , NewS ) : - 

check_sem(S,Rest,_,_) , % phrase in sent, is in lexicon - remove it 

remove_sem (Rest , NewS) , ! . 
remove_sem ( S , NewS ) : - 

check_no_sem(S,Rest,_) , % phrase in sent, is in nosem list - remove it 

remove_sem (Rest, NewS) , ! . 
remove_sem( [X|Tail] , [X|NewS] ) 

remove_s em (Tail, NewS) , ! . % not a phrase, process rest 
% remove_words (+Sent, -NewSent) : Sent is the original sentence, NewSent 
% is stripped of all words that are in lexicon 
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remove_words ([],[]) : - I . 
remove_words ( [X | Rest] , NewRest) : - 

( (foundword(X) ; number (X) ) , % X is defined in lexicon 
r emove_words (Rest, NewRe s t ) , ! ; 

remove_words (Rest, New) , NewRest = [X|New], ! % X is not in lexicon 

) . 

%maxphrase (+Listof Phrases, +Maxin, -MaxOut, InitMaxLen) is true if 
% ListofPhrase is a list of multi-word phrases, 
% Maxin is phrase with maximum words so far 

% MaxOut is phrase with maximum length of phrases in Listof Phrases 

% InitMaxLen is length of initial phrase which is of max. length 

maxphrase ([], Maxin, Maxin, _) :- !. % no more phrases - maximum is same as maxin 
maxphrase ( [P | Rest] , Maxin, Maxout , InitMaxLen) : - 

length (P, Len) , % length of first phrase 

( Len > InitMaxLen, !, maxphrase (Rest , P, Maxout, Len) ; 
Len < InitMaxLen, !, maxphrase (Rest, Maxin, Maxout , InitMaxLen) 

) . 

%%%%%%%%%%%%%%%%%%%%%%%%%%% lexical interface predicates %%%%%%%%%%%%%%%%%%%%%% 
%acclex (Sem, W, SO, S) : - 

% output form(htext) , !, acclexl (Sem, W, SO , S) . 
acclex (Sem,-W, SO, S) :- ^ ^ . 

acclex2 (Sem,W,SO,S) . 
acclex (Sem, W, SO , S) : - 

acclexss (Sem, Syn, Target , Features , SO , S) . 
% check lexicon for word or phrase, Target form is original W 
acclexl (p, [P,C] , [w|Rest] ,Rest) :- 
is_list (W) , 

f ind_sem_j?hrase (p, [P,C] ,W) . 
acclexl (p, [P,C] , [W|S] ,S) :- atom(W) , 

wdef (W,p, [P,C] ) . 
acclexl (Sem, [W] , [W | Rest] , Rest) : - 

is_list(W), %if bracketed list, get Sem and Code from phrasal lexicon 

f ind_sem_phrase (Sem,_, W) . 

acclexl (Sem, W, [W| S] , S) : - atom(W) , 

wdef (W, Sem,_) . 

% check lexicon for word or phrase, Target form is taken from lexicon 
%acclex2 (Sem, Code, [W | Rest] , Rest) :- 

% is_list(W), %if bracketed list, get Sem and Code from phrasal lexicon 

% f ind_sem_j)hrase (Sem, Code, W) . 

acclex2 (Sem, Code, [w|S],S) :- f oundword (W, Sem, Code) , 

nonvar (Code) . % protect against 

lex. error 

% find a phrase [W|Tail] in lexicon that begins with W and has category Sem 
find_sem_phrase (Sem, Code, [W|Tail]) :- 

phrasal (W, Sem, [W | Tail] , Code) , % phrase and code beg. with W 

nonvar (Code) . 

% case where phrase is already bracketed, look up phrase 
sem_f inding_phrasel (Code, [W|Tail] ,Tail) :- 

is_list(W), %phrase is bracketed 

f ind_sem_sent (Code, W) , 
nonvar (Code) . %protect against lexical error 
% case where phrase is already bracketed, look up phrase 
sem_f inding_phrase2 (Code, [w|Tail] ,Tail) :- 

is_list(W), %phrase is bracketed 
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f ind_sem_sent (Code, W) , 
nonvar (Code) . %protect against lexical error 
% Phrasal succeeds if lexicon contains phrase 
phrasal (Wl, Sem, Phrase, Code) : - 

phrase (Wl, Sem, Phrase, Code, _) . %multi-word phrase in lexicon 
% added MarchlS, 1999 
phrasal (Wl, Sem, Phrase, Code) : - 

semp (Wl, Sem, Phrase, Code , Features) . 
% lexical definition from marked up input 
phrasal (Wl, Sem, [Wl | Tail] , Code) 

phr(Wl, Sem, Tail, Code) . 
acclexss (Sem, Syn, Target , Features , [W | S] , S) : - 
atom(W) , 

semw(W, Sem, Target, Features) , 
synw(W, Synclass) , 
member (Synclass , Syn) . 
acclexss (Sem, Syn, Target , Features , [W|S] ,S) :- 
is_list (W) , 

f ind_phrasess (W, Sem, Syn, Target , Features) . 
f ind_phrasess ( [Wl|fail] , Sem, Syn, Target , Features) :- 
semp (Wl, Sem, [Wl|Tail] , Target , Features) , 
synp(Wl, -[Wl |Tail] , Synclass) , 
member (Synclass, Syn). 

% lexical definition of a complete finding 
f ind_sem_sent (Code , [W | Tail] ) : - 

sem_f inding_sent (W, [w|Tail] , Code) . 

listify(C, [C] ) :- 

atom(C), I. 
listify(CC) :- 

is_list (C) , ! . 

% distributes left mods and right mods over list of findings creating 
% list of lists of findings with mods 
distributemods ([],[] ,_,_,_) :- !. 

distributemods (Dist , [Dl|Tail] , Lmods , Rmods , Type ) :- 

distributemods (Dist2 , Tail , Lmods , Rmods , Type) , %distributed for remainder 
mergemods ( Lmods , Rmods , Al lmods ) , 

f rame (D, Type, Dl, Allmods) , %Type frame with mods 

append ( [D] ,Dist2, Dist) . % Combine findings to get list of findings 

% fixconj - if Leftmods has [certainty, no] , and Conj = or, change Conj to and. 
% no A or B = no A and no B; 'denies A, B, or C is similar, 

fixconj (Leftmods , Conj , [rel , and] ) : - 

(member ( [certainty, no] , Leftmods) ; member ( [certainty, deny] , Leftmods) ) , 

Conj = [rel, or] . 
fixconj Conj , Conj ) . 

% write_sentences/l inputs a PROLOG list and prints out lines 

% which which are English sentences. No wrapping is done. 

write_sentences ( [] ) : - ! . 

write_sentences ( [X] ) :- write (X) , nl . % special sentence - section name 
wri te_sentences ([ , < , ,p / , / , i , > 1 ]) : - 

write (' <p/> ') , nl . % paragraph mark 
write_sentences ( [X | Rest] ) : - 

upper_f irst ( [X|Rest] , [U|Rest]), 
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write (U) , % First letter of first word made upper case 
%write (X) , 

(X = U, chkforpunct (U,Rest) , !, write_terms (Rest ) ; % no space needed 
write ( ' * ), write_terms (Rest) 
) . 



% write_sentence/2 inputs a PROLOG list and prints out an English 

% sentence wrapped. Idlen is the starting position of the sentence 

% in the output. 

% uses libraries ctypes, basic, not 



write_sentence ( [X | Rest] , Idlen) : - 

upper_f irst ( [X | Rest] , [U | Rest] ) , 
write (U) , 

name (U, LU) , length (LU, L) , 

(U = X, chkforpunct (U, Rest) , !, write_terms (Rest , L+Idlen) ; 
write(' ')/ write_terms (Rest , L+Idlen+1) 
) . 

% write_list inputs a PROLOG list and prints out a sentence like list. 

% wrapped. Idlen is the starting position of the list in the output. 

write_list ( [X | Rest] , Idlen) : - 

- write (X) , — - - - 

name(X,LU) , length (LU, L) , 

( chkforpunct (X, Rest) , write_terms (Rest , L+Idlen) , !; 
writeC write_terms (Rest , L+Idlen+1) ) . 

%write_list (+List, +Idlen, -Idlenout) 

% write_list prints out a sentence like list with wrapping if necessary. 

% List is the list to be printed 

% Idlen is the column position at start 

% Idlenout is the column position at end 

write_list ( [] , Len, Len) :- !. 

write_list ( [X | Rest] , Idlen, Idlenout) : - 

atomic (X) , write (X) , 

name(X,LU), length (LU, L) , 

(L + Idlen > 74, nl, Idlen2 =1, ! ; 
Idlen2 = L + Idlen, ! 

) , 

(chkforpunct (X,Rest) , write_list (Rest, Idlen2 , Idlenout ) , ! ; 
write ( ' ' ) , write_list (Rest , L+Idlen2+1 , Idlenout) , ! 

) ; 

isJList(X), write_list (X, Idlen, Idlen2) , writeJList (Rest , Idlen2 , Idlenout) . 

upper_f irst ( [X | Rest] , [U | Rest] ) : - 
name(X, [L | Z] ) , 
(is_alpha(L) , Up is L - 32, ! / Up = L) , 
name(U, [Up|Z] ) , ! . 

% write_terms/l writes out a word followed by blank, except for punctuations. 

write_terms ( [] ) :- !. 

% case where X is end of sentence 

write_terms ( [X | Rest] ) : - 

(X = 1 . ' ; X = ' ; • ) , % last word of sentence 

write (X), nl, !, write_sentences (Rest) , !. 
% case where X is interior of sentence 
write_terms ( [X | Rest] ) 
write (X) , 

(chkforpunct (X, Rest) , write_terms (Rest ) ; 
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write ( ' * ), write_terms (Rest) 
), !. 

% write_terms (List , Used) : writes the terms in list and counts the number 
% of columns used; starts new line if 75 columns have been used 

write_terms ([],_) : - ! . 
% at end of list 

write_terms ( [ . 3 , _) :- write ('.') , nl,!. 
write_terms ([;],_) : - write (';'), nl , ! . 
% X is a punctuation, don't add to final count 
write_terms ( [X | R] , Used) : - 

( R = [] , write (' •), write (X) , !; 

chkforpunct (X, R) , 

write (X) , write_terms (R, Used) , ! 

) . 

% X is last word in sentence 
write_terms ( [X, . ] , Used) : - 

name(X, List), length(List, Len) , 

Need is Len + 2, 

Total is Used + Need, 

(Total =< 75, write (' r ),write(X), write (.) ; 
Total > 75, nl, write ( ' '), write (X), write (.)) , 

nl, ! . — — 

% X is last word in sentence 
write_terms ( [X, ; ] , Used) : - 

name(X, List), length(List, Len), 

Need is Len + 2, 

Total is Used + Need, 

(Total =< 75, write (■ ' ), write (X) , write (';•) ; 
Total > 75, nl, write ( ' ■), write (X), write (.)) , 

nl, ! . 
% X is followed by ■ , • 
write_terms ( [X, ' , 1 |Rest] , Used) : - 

name(X, List), length(List, Len), 

Need is Len + 2, 

Total is Used + Need, 

(Total =< 75, write {' '),write(X), write {','), 
write_terms (Rest, Total) ; 

Total > 75, nl, write ( ' '), write (X), write {',') , 
New is Need - 1, write_terms (Rest , New)), 
I 

% writes blank + name of X, used is length of name+1 
write_terms ( [X | Rest] , Used) : - 

name(X, List), length(List, Len), 

Need is Len + 1, 

Total is Used + Need, 

(Total =< 75, write (' '), write (X) , write_terms (Rest , Total); 
Total > 75, nl, write ( 1 '), write (X) , write_terms (Rest , Len)),!. 
write_terms ( [ * X ' ' s ' | Rest] , Used) : - 
name(X, List), length(List, Len), 
Need is Len + 3 , 
Total is Used + Need, 

(Total =< 75, write (' »), write (X) , write (•" s ") , 
write_terms (Rest, Total) ; 

Total > 75, nl, write(X), write_terms (Rest , Len)),!. 
% processes sentences in Infile; writes formats to Outfile 
% sentences beginning with ' % ' are treated as comments 
testsents (Infile, Outfile) : - 



see(Infile), seen, see(Infile), 

tell (Outf ile) , 

readtests, 

see(Infile), seen, told. 
% reads next sentence and processes it 
readtests : - 

read_in (X) , 
(X = end_of_file, ! ; 
X = [eoff , ' . •] , ! ; 
X = [ " ] , ! ; 

X = [' %'!_]/ i/ readtests; % don't process comments 
preprocess (X, Bs,Undef , Semlist, skip) , 
( Undef = [] , 

dosent (X , Bs , Semlist , Fmt , Message , impression , W , chestxray , strict , 0 ) , 
write_sentence (X, 1) , write (Bs), nl, 
write (Fmt) , nl ; 

Undef \= [] , write_sentence (X, 1) , write(Bs), nl, write (Undef ) , nl) , 
readtests % read next sentence 

) . 

% Reads in all sentences from input file and creates one list of all sentences 
get__inputsents (Prevlist , Toklist) : - 

read_in (X) ,- — • - • - ^ ^ - - 

(X = end_of_file, Toklist = Prevlist, !; 

X = [eoff,'.'], Toklist = Prevlist, ! ; 

X = ['*], Toklist = Prevlist, ! ; 

(lastC',X), append (Toklist, [ ' 1 ] ,X) , !; %remove 

append (Prevlist , X, Newlist) , 

get_inputsents (Newlist , Toklist) 
)) . 

%get_sentence (+A, -B, -C) 

% Gets next sentence from input list containing all sentences read in 

% Don't end a sentence if " . " is preceded by a number and followed by 

% a number and unit measure - 1.25 cm, 1.5 cm, .5 cm 

% or is followed by a " . " which is part of abbreviation 

% get_sentence(A,B,C) - A is list of all sentences in report 

% - B is list containing one sentence 

% - C is remainder excluding B 

% sgml tag for multi-word phrase containing ' . ' that is not end of sentence 
get_sentence ( [ ' < ' ,phr | Tail] , Sentence, LRest) : - 

enclosedPart (Tail, phr, Between, Rem) , % Between beg. part of open phr and 
close tag of phr 

append ( [sem, = , ' " ' , Sem, ' " ' ] , MoreAttributes , Between) , %Sem is value of sem 
attribute 

(MoreAttributes = [■>' | Phrase] , TargetList = Phrase, !; 
MoreAttributes = [t ,=,»"' | TargetPlus] , % Target terms plus end of phr 
append (TargetList, ["",•> • | Phrase] , TargetPlus) , ! % t attribute followed 
by actual phrase 
), 

Phrase = [Wl|Rest], 

append (Phrase, SRest, Sentence) , 

concat_atom (TargetList , Target) , 

assert (phr (Wl, Sem, Rest, Target) ) , % assert lex def according to input 
%Phrase = [Wl | PRest] , 
%abbrev (Wl , [Wl | PRest] , Target , _) , 
get_sentence (Rem, SRest , LRest) , ! . 



% Ignore sentence starting with ' %', get next sentence 
get_sentence (['%', 1 % ' |Rest] , Sent , Remainder) : - 
get_sentence (Rest , _, Rem) , 
get_sentence (Rem, Sent , Remainder) . 
get__sentence( [X, . ,Y,Z| Rest] , [X, .], [Y,z| Rest] ) :- % break up "140. 3 + " 

number (X), number (Y), Z = ' + *, !. % Y belongs to ' + • for new sentence 
get_sentence ( [X, . ,Y,Z|Rest] , [N|SRest] , LRest) :- % 1.5 cm 

number (X) , number (Y) , 
% (wdef (Z,unit,_) ; Z = x) , 
Z \= • + », % break up "140. 3 + " 
t 

name(X,Dl), name(.,D2), name(Y,D3), name ( ' E+00 ' , D4) , 
append ( [D1,D2,D3,D4] ,D) , name(N,D), % put number together 
get_sentence ( [Z|Rest] , SRest , LRest) . 
% common abbrev 

get_sentence< [X, . | Rest] , [X| SRest] , LRest) :- % abbrev ending in "." 

% list of common abbreviations seen in reports should not end sentence 

member (X, [vs , dr , cm, mg] ) , get_sentence (Rest , SRest , LRest) , 1. 
% list of start of names in reports should not end sentence 
get_sentence ( [X, . |Rest] , [XjSRe'st] , LRest) :- % abbrev ending in " . " 

member (X, [ms, mr , mrs , dr , st] ) , 
- skipname (Rest , RestO) , % skip name part . 

get_sentence (Rest 0, SRest, LRest) , ! . 
% more known abbreviations 

get_sentence ( [Wl | Rest] , [Rep | SRest] , LRest) : - 

abbrevchk( [Wl|Rest] ,_,Rem,Rep) , % abbreviation 

get_sentence (Rem, SRest , LRest) , ! . 
% possible simple xml tag for new paragraph 

get_sentence( ['<» ,p, '/','>' | Rest] , Sent, Rem) :- %skip paragraph marker 

get_sentence (Rest , Sent , Rem) , 1 . 
% xml tag for sentence ' <s>' 

get_sentence ([^'^s,^'! Tail] , Sentence , Rest) : - 
enclosedPart (Tail , s , Sent , Rest) , 

(last ('.', Sent) , Sentence = Sent, ! ,* %already has 1 .' 
append (Sent , [ . ] , Sentence) 
) , ! . %add » . ' 

get_sentence( [. | Rest ],[.], Rest) :- I. %end of a sentence 
get_sentence ( [ ; j Rest] , [ ; ] , Rest) : - ! . 
% interior of sentence 

get_sentence ( [X | Rest] , [X | SRest] , LRest) : - 

get_sentence (Rest, SRest, LRest) . 
get_sentence ( [],[],[]). % no more sentences 

% abbrevchkf+WordList, -AbList, -RemList, -Target) is true if an abbrev is prefix 
% of WordList, RemList is suffix of WordList (excluding prefix), 
% AbList is prefix consisting of abbreviation 
% and Target is target form of abbreviation 
abbrevchk ( [Wl | Rest] , AbList , RemList , Target ) : - 

abbrev (Wl, AbList, Target, Dom) , % abbrev knowledge base indexed by 1st word 

append (AbList, Rem, [Wl | Rest] ) , % remainder of abbrev. must be in sentence 

(Dom = general, ! ; % abbrev. applies to all domains 
domain (Thisrep) , Dom = Thisrep, !; % abbrev. applies to this domain 
is_list (Dom) , member (Thisrep, Dom) % this domain in abbrev. list 

>, 

( % add back ' . • to sentence if it also signals end of sentence 
Rem = [] , last ( • . 1 , AbList) , RemList = ['.'], ! %no more words 
; % words that generally start a new sentence 



Rem = [W2|_], last ( ' . ' , AbList) , member (W2 , [his, her, he, she, the, this] ) , 
RemList = [ * . ' | Rem] , I 
% don * t add ' . • back 
RemList = Rem 

) . 

% skipname (+Beglist, -Endlist) : skips next word after "mr" or "st" 
skipname {[],[]) : - ! . 

skipname < [_, ,,,, ,s|Rest] , Rest) :- !. % "Luke's" 
skipname { [o, ' ' •' ,_| Rest] , Rest) : - !. % "0 1 Grady 
skipname ( [_| Rest] , Rest) :- !. 

%get_section (+Toklist, -Sents, -Rest, -Section, -Printname, Addno) 
% Toklist contains input list; 1st sentence should be a header; 
% Sents are all sentences in section; Section is name of section 
% Sentences at beg. of Toklist are ignored until a section header is found 
get_section( [T| Toklist] , Sents, Rest , Section, Printname , Addno) : - 
% first sentence should be section header 
get_sentence ( [T| Toklist] , Sentence, RToklist) , 

(section_header (Sentence, Rsent, Section, Printname) , % Sentence is a section 

header 

append (Rsent , RToklist , RToklist2 ) , 
get_sectionsents (RTokl is t2 , Sents , Rest ) , 

(Addno = 0, !; % testing if input begins with section header 

Addno = 1, ! , sectno (Sectno) , Newno is Sectno + 1, 

retractall (sectno (_) ) , assert (sectno (Newno) ) 
>, 

retractall (paragno(_) ) , assert (paragno (1) ) , %lst parag. of section 
retractall (sentno (_)) , assert (sentno ( 0) ) %lst sentence of parag. 
% 1st sentence is not a legitimate header - return [] 
Section = [] 

% get_section (RToklist, Sents, Rest, Section) % skip till find header 
), !• 

get_section( [],[],[], [] ,_,_) • 
get_sectionsents ([],[],[]) : - ! . 
get_sectionsents (Toklist, Slist , Rest) : - 

get_sentence (Toklist, Sentence, RToklist) , % one sentence 
(\+ section_header (Sentence, _,_,_) , %more sentences in section 
get_sectionsents (RToklist , RSents , Rest) , 
append (Sentence, RSents , Slist) 

; % the next section is a section header - return 
Rest = Toklist, Slist = [] ) . 

sect ion_header (S, Rests, ' report clinical information item', 
'CLINICAL INFORMATION: . ' ) : - 
(S = [clinical, information, ' :','.'] , ! , Rests = [] ; 
begsublist ( [clinical, information, ' : ' ] , S, Rests) , ! ; 
S = [clininfo, ':*,'. ! ] , Rests = [] , ! ; 
begsublist ( [clininfo, • : ' ] , S, Rests) , ! 
) . 

section_header (S, Rests, * report impression item' , 
• IMPRESSION: . ' ) : - 
(S = [impression, 1 :*,.] , Rests - [] , !; 
begsublist ( [impression, ' : ' ] , S, Rests) , ! 
) . 

section_header (S, Rest, 'report summary item' , ' SUMMARY : . » ) :- 
S = [summary, * : 1 |Rest] . 



si 

section_header (S, Rests, 'report description item' , 'DESCRIPTION: . ') :- 
(S = [description, ':',.], Rests = [] , ! ; 
begsublist { [description, * : ' ] , S, Rests) , ! 
) . 

sec tion_header(S, Rest, 'report diagnosis item' , ' DISCHARGE DIAGNOSIS: . ') :- 
(S = [discharge, diagnosis , ' : ' |Rest] ; 
S = [final, diagnosis, ' : ' |Rest] ; 

S = [principle, diagnosis, ':' |Rest] ; S = [associated, diagnosis, ':' | Rest] ; 
S = [transfer, diagnosis, ' : ' |Rest] ; 
S = [diagnosis ,'(', es ,')',':' | Rest] ; 
S = [diagnosis, : | Rest] 
), !. 

section_header(S, Rest, 'report laboratory data item', 'LAB DATA:.') :- 

S = [laboratory, data, ' : ' |Rest] , ! . 
section_header (S,Rest, 'report medications item' , 'MEDICATIONS: . ') :- 

S = [medications, ' : ' |Rest] , ! . 
section_header(S, Rest, 'report current medications item' ,' MEDICATIONS :.' ) :- 

S = [current , medications , ' : 1 |Rest] , ! . 
section_header(S, Rest, 'report discharge medications item ; , 

• DISCHARGE MEDICATIONS : . ' ) : - 
=— S = -[discharge, medicat ions, ' : ' [Rest] , ! . _ 
section_header (S,Rest, 'report discharge disposition item', 
' DISCHARGE DISPOSITION : . ' ) : - 
S = [discharge, disposition, ' : ' |Rest] , ! . 
sect ion_header (S, Rest, ' report medications on admission item', 
'MEDICATIONS : . ' ) : - 
S = [medications, on, admission, ' : ' |Rest] , I . 
section_header(S, Rest, ' report medications on transfer iterm' , 
•MEDICATIONS: . ') :- 

S = [medications, on, transfer, ' : 1 |Rest] , ! . 
sect ion_header(S, Rest, 'report procedure item' , 1 PROCEDURE : . ' ) :- 
(S = [operation, ' : ' |Rest] ; S = [procedure, ' : ' |Rest] 
) , ! • 

section_header(S, Rest, 'report indications for procedure item 1 ,' INDICATIONS : 

(S = [indications, for, procedure, ':* |Rest] ; S = 

[indications, for, operation, ' : ' |Rest] 

) , 
i 

section_header(S, Rest, 'report preoperative diagnosis item',*PREOP DIAGNOSIS 

S = [preoperative, diagnosis, • : * |Rest] , ! . 
section_header(S, Rest, 'report admitting diagnosis item *, 'ADMITTING 
DIAGNOSIS: . ' ) :- 

S = [admitting, diagnosis, ' : * [Rest] , !. 
section_header (S,Rest, 'report postoperative diagnosis item' , 'DIAGNOSIS: . ') 

S = [postoperative, diagnosis, ' : * |Rest] , ! . 
section_header (S, Rest, ' report physical examination item', 
'PHYSICAL EXAM: . ' ) : - 

S = [physical, examination, ' : ' (Rest] , ! . 
section_header(S, Rest, 'report chief complaint item', 'CHIEF COMPLAINT:.') :- 

S = [chief , complaint, ':' |Rest] , !. 
section_header(S, Rest, 'report hospital course item ',' HOSPITAL COURSE:.') 

S = [hospital, course, ' : ' |Rest] , ! . 
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sectionjieader (S, Rest, 'report allergy item' , ' ALLERGIES : . ') :- 
S = [allergies, ' : • [Rest] , ! . 

sectionjieader (S, Rest, 'report follow up item' , 1 FOLLOW UP: . ') :- 

S = [follow, up, • : ' |Rest] , !. 
section_header ( S , Rest , ' report findings item • , ' FINDINGS : . ' ) : - 

S = [findings, ':' |Rest] , !. 
section_header (S, Rest, 'report indications and findings item* , f FINDINGS : . ' ) 

S = [indications, and, findings, ':' |Rest] , !. 
section_header (S, Rest, 'report indications and findings item ',* INDICATIONS : . 

S = [indications, ' : ' |Rest] , ! . 
section_header(S, Rest, 'report provisional diagnosis item 1 , ' PRELIM DIAGNOSIS 

S - [provisional, diagnosis, ' : ' |Rest] , ! . 
section_header(S, Rest, 'report review of systems item' ,' REVIEW OF SYSTEMS:.' 

S = [review, of , systems, * : * |Rest] , ! . 
section_header (S, Rest, 'report past history item', 'PAST MEDICAL HISTORY:.') 

S = [past , history, section, * : ' |Rest] , ! . 
sectionjieader (S, Rest, 'report past history item»,'PAST MEDICAL HISTORY:.') 

S = [past , medical, history, ' : ' |Rest] , ! . 
sectionjieader (S,Rest, 'report social history item' , 'SOCIAL HISTORY: . ') :- 

S = [social , history, • : ' | Rest] , ! . -^=- _ . .. . 

sectionjieader (S, Rest, 'report past history item', 'PAST MEDICAL HISTORY:.') 

S = [history, ' : • |Rest] , ! . 
section header (S, Rest, 'report past history item', 'PAST MEDICAL HISTORY:.') 

S = [brief , history, ' : ' |Rest] , ! . 
sectionjieader (S, Rest, 'report history of present illness item', 
'HISTORY OF PRESENT ILLNESS:.') :- 

S = [history, of , present, illness, ': 1 |Rest] , !. 
sectionjieader (S, Rest , 'report history of present illness item', 
'HISTORY OF PRESENT ILLNESS:. 1 ) :- 

S = [history, of, the, present, illness, 1 :' |Rest] , !. 
sectionjieader (S, Rest, 'report specimen item' , 1 SPECIMEN' ) :- 

S = [specimen | Rest] , !. 

% sentence consists of id number only or "." only, 
isidentif ier ( [X, . ] ) :- 

integer (X) . 
isidentif ier ( [X, ;] ) :- 

integer (X) . 

isidentif ier ([.] ) :- !. % sentence consists only of . 
isidentif ier (['.',' <eos> ' ] ) : - ! . 

isident if ier (['<' ,p, '/','>'] ) :- % paragraph marker sentence - update no. 
paragno (N) , 

retractall (paragno (_) ) , 
Newno is N + 1, 
assert (paragno (Newno) ) , 
retractall (sentno (_) ) , 
assert (sentno (0) ) . 

% skipsentence is true, if sentence should be ignored. 
% Skip sentences containing family info 
skipsentence ( [X | ) :- 

foundword(X, family) , ! . 
skipsentence ( [X | _] ) : - 

foundword (X, insurance) , ! . 
% This occurs if sentence contains 
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% a sequence in skips database and sentence also contains findings. 

skipsentence ( [X | Rest] , Semlist , Error) : - 

skips { [x|Sseq] ) , % X is the beg. of subseq. in skip database 
prefix { [X | Rest] , [X|Sseq] ) , % sentence contains subseq. 
(subtype (_, Semlist) , % sentence contains information to be extracted 
Error = no; % don't try to segment 

Error = yes), !. % treat sentence as error and try to segment. 

skipsentence ([_ | Rest] , Semlist , Error) :- 
skipsentence (Rest, Semlist , Error) . 

% f indingseg (+S, -Fseg, -Begseg) : partitions sentence 



% S is the sentence; Begseg is the segment preceding the 
% modifiers of the finding; Fseg is the segment of S starting 

% with the leftmost modifier of the finding and consists of the 

% remaining sentence. 



f indingseg (S, Fseg, Begseg) : - 

partition (S, Begpart , Restpart) , 
(Begpart = [] , Begseg = [] ; 
Restpart = [] , Fseg = [] , Begseg = S; 
rightlstmod (Begpart, Begseg, Modseg) ) , 
append (Modseg, Restpart , Fseg)-. - 
f indingseg (_, [] ,_) :- !. 
actionf indingseg (S , Fseg, Begseg) : - 

partition (S, Begpart, Restpart) , 
(Begpart = [] , Begseg = [] ; 
Restpart = [] , Fseg = [] , Begseg = S; 
reverse (Begpart , ReversedBef ore) , 

f indsubstance (ReversedBef ore , Rest ) , 
append (Subs tancepart , Rest , ReversedBef ore) , 
reverse (Subs tancepart, Leftpart) , 
reverse (Rest, Begseg) , 
append (Leftpart , Restpart , Fseg) ) . 
actionf indingseg (_, [] ,_) :- ! . 
f indsubstance ([],[]):- ! . 
f indsubstance ( [X | Rest] , Rest) : - 

substance (_, [X] ,[]),!. 
f indsubstance ( [X | Restl] ,Rest) :- 
f indsubstance (Restl, Rest) . 



% partition (+S, -Begpart , -Restpart) : partitions sentence 
% S is initial 

% partition (+S, -Begpart, -Restpart) : partitions sentence 

% S is initial sentence; Begpart is part of sentence before the 

% finding; Restpart is the rest of the sentence and starts with 

% the finding. If there are 2 consecutive findings 

% the 1st one is considered a modifier 



partition ( [],[],[]) :- ! . 

partition ( [X | Rest] , [X | Begpart] , Restpart) : - 

not (isfinding(X) ) , !, partition (Rest , Begpart , Restpart) . 

partition ( [X, Y | Rest] , [X] , [Y | Rest] ) : - 
isf inding (X) , isf inding (Y) , !. 

partition ( [X|Rest] , [] , [X|Rest] ) : - 
isf inding (X) , ! . 

% isf inding (+X) : is true if X is a word or phrase whose semantic class 
% is a finding or subtype of finding. 
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isfinding(X) :- 

foundword (X, Sem) , % semantic class of word 

subtype {_, [Sem] ) . % is class a type of finding, recommend, or technique 

% semantic class which are types of relevant information 
subtype (finding, Sem) : - 

intersect (Sem, [attach, createbond, breakbond, activate, 
inactivate , substitute , transcribe , express , promote , 
signal] ) . 

% there is only one type of technique class 
subtype (technique, Sem) :- 

member (technique, Sem) . 
subtype (time, Sem) : - 

intersect (Sem, [status, sstatus, change, tmper , vstatus] ) . 
f indinginlist (Sem) : - 

intersect (Sem, [attach, createbond, breakbond, activate, 
inactivate, substitute, transcribe, express, promote, 
signal] ) . 

% chkforpunct (+W,+Rest) : is true if there should be no space after word W 
chkforpunct (W,_) :- member (W, [ ' / ' , • < 1 , ' > ' , ' - ' , ' " 1 , 5 L ; , ; ] ! , 

'{•,'}' ,•_•,' + ',' = ',' | \ '\'] ) , ! . 
% nothing left to write . - ^ _ ^_ 
chkforpunct (W, [] ) : - ! . 

% is true if there should be no space before word after current word 
chkf orpunct (_, [W|_]) :- 
ispunct (W) . 

% ispunct (+W) is true if W is a punctuation for sentence print out 

% The following characters are not treated as punct: - " # $ * & * 

ispunct (W) : - member (W, [',',' .•,';','/",* < ' ,'>','? ' , ' " 1 , l " ' * ' : ' > ' "' ' ' t ' ' * ^ ' ' 

' { ' , 1 } ' , ' ( ' , ') ' , / , , ' I ' / '\' i * ,@ '^ * 
% rightlstmod(List, Firstpart , Modpart) : Modpart begins with the first 
% word in List which is a modifier; Firstpart are the preceding words 
rightlstmod( [],[],[]) : - ! . 

% X is a modifier or finding; Beginning part is empty 
rightlstmod ( [X | Rest] , [] , [X | Rest] ) : - 
foundword (X, Sem, Target) , 

(modifier (Sem) ; Sem = p, Target = [_,conn]; subtype (_, [Sem] )) , !. 
% X is not a modifier or finding 
rightlstmod ( [X|Rest] , [X | Firstpart] , Modpart) :- 

rightlstmod (Rest, Firstpart , Modpart) . 

% frame (Frame, Type, Value, Mods) : creates a list Frame, whose 1st 

% element is Type, 2nd element is Value, and 3rd is a list of 

% modifier frames or is emtpy 

% Case where modifier list is empty; Value should be atom except for 
% certain types; 

frame ( [Type, Value] , Type, Value, X) :- 
(X = []; X = [[]]), 
atom (Value) , ! . 
% Special cases where value of type should be a list 
frame( [Type, [H|R] ] ,Type, [H|R] ,X) :- 
(X = [] ; X = [[]]) , 
oklist (Type) , ! . 

% Modifier list is merged with list consisting of Type and Value 
frame ( Frame , Type , Value , Mods ) : - 
atom (Value) , 

append ( [Type, Value] , Mods, Frame) , ! . 
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frame (Frame, Type, [H|R] , Mods) :- 
is_list (R) , 

append ( R , Mods , NewMods ) , 
append ( [Type, H] , NewMods, Frame), !. 
% Components of Frame 

frame ( [Type, Value | Mods] , Type, Value, Mods) :- ! . 

% Value of Type should not be a list; first element of value is real value 

frame ( [Type, H, Rest] ,Type, [H|Rest] , [] ) : - ! . 

% Special cases where value of type should be a list 

%frame ( [Type, [H|R]],Type, [H | R] , [] ) :- %repeated from rule above 

% oklist (Type) , ! . 

% Value of Type should not be a list; first element of value is real value 
frame (Frame, Type, [H|Rest] ,Mods) :- 

mergemods (Rest , Mods, NewMods) , 

append ( [Type , H] , NewMods , Frame) . 

% mergemodinf (-F, +Frame, +Mods) : Frame is a type-value-mod frame; Mods 
% is an additional set of modifiers for Frame; mergemodinf adds Mods 
% to Frame, resulting in F. 
mergemodinf ([],[],_):-!. 
mergemodinf (F, [rel,X|Rest] ,Modrel) :- 
= — mergemodinf (Fl, Rest , Modrel) ,. 

append ( [rel , X] , Fl , F) , ! . 
mergemodinf (F, [Fl, X | Modf in] , Modrel) :- 

atom(Fl) , mergemods (Modrel, Modf in, Mod) , 

append ( [Fl , X] , Mod, F) , ! . 
mergemodinf (F, [H|R] , Modrel) :- 

mergemodinf ( Fl , H , Modrel ) , 

mergemodinf (F2 , R, Modrel) , 

append ( [Fl] ,F2,F) . 

% addmodstof (+Args, +Mods, -NewArgs) is true if Args is a list of formats, 

% Mods is a list of modifiers and NewArgs is a list of formats where Mods 

% has been added to modifier list of that format 

addmodstof ( [] ,_, [] ) :- ! . % no more formats 

addmodstof ( [Formatl | Rest] ,Mods, [Fl |NewRest] ) : - 

mergemodinf (Fl, Forma tl, Mods) , % merge modifiers into 1st format 
addmodstof (Rest, Mods, NewRest) , !. %add modifier to remaining 

% oklist (+Type) : is true if Type can have a list as its value 

oklist (unitval) . 

oklist (age) . 

oklist (measure) . 

oklist (prev_timeunit) . 

oklist (future_exam) . 

% mergemods (+Modsl, +Mods2, -Mod) : Modsl and Mods2 are a list of modifier lists 

% Mod is the merged list; some elements of Modsl and Mods2 may be 

% empty 

mergemods ([], M, M) :- !. 

mergemods (M, [] ,M) . 

mergemods (Modsl , Mods 2 , Mod) : - 

delete (Modsl, [] ,M1) , 

delete (Mods2, [] ,M2) , 

append (Ml, M2, Mod) . 

% addmod(+Mod, +Modlist, -NewMod) : NewMod is formed by including 
% Mod into Modi is t 

addmod( [] , Mod, Mod) : - ! . 
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addmod (Mod, [] , [Mod] ) : - ! . 
addmod ( Mod , Modi i s t , NewMod ) : - 

append ( [Mod] , Modlist , NewMod) . 
% modlist (+Listof Mods, -Mods) : ListofMods is a list consisting of 
% individual modifier frames, some of which may be empty 
% Mods is formed as a list of non-empty modifiers 
modlist ( [],[]) : - ! . 

% ignore a modifier which is an empty list 
modlist ( [ [] |R] ,Mods) :- 

modlist (R, Mods) , ! . 
modlist ( [ [H|R1] |R2] ,Mods) : - 

atom(H) , ! , 

modlist (R2 , Rmods) , 

addmod ( [H | Rl] , Rmods , Mods) . 
modlist ( [[H|R1] |R2] ,Mods) :- 

is_list(H), ! , % is first element is a list 

modlist (R2 , Rmods) , 

mergemods ( [H|R1] , Rmods, Mods) . 

%bpframe: creates from for sequences of bodyloc /region/posit ion- 
bpframe(F, [] ,_,F, [] ) :- !. % only 1 bodyloc 

bpf rame ( F , [ ] , Type , Bpl , Bp2 ) :- % no conj relation but more than 1 bodyloc 
frame (Bpl , BplType , BplVal , BplMods) , %contents of Bpl frame 
frame (Bp2 , Bp2Type , Bp2Val , Bp2Mods) , %contents of Bp2 frame 
( (BplType = region; BplType = position) , 
Bp2Type = bodyloc, % 'left lung 1 , 'area of lung' 
mergemods (BplMods, Bp2Mods, BpMods) , %new region modifier 
frame (NewBp2Mods, BplType, Bp lVal,BpMods) , %new Bpl frame w new mod 
frame (F, Bp2 Type, Bp2Val, [NewBp2Mods] ) % main frame is bodyloc 

BplType = bodyloc, Bp2Type = bodyloc, Type = main, %Bp2 is main 

mergemods (BplMods, Bp2Mods, BpMods) , %new bodyloc modifier 

frame (NewBp2Mods, BplType, BplVal, BpMods) , % 'joint of shoulder' 

frame (F,Bp2Type,Bp2Val, [NewBp2Mods] ) % main bp frame is shoulder 

mergemods (BplMods , Bp2Mods , BpMods ) , 

frame (NewBplMods , Bp2Type , Bp2Val , BpMods ) , % * shoulder j oint ■ 
frame (F, BplType, BplVal, [NewBplMods]) % main bp frame is shoulder 

), !- 

bpf rame (F, Rel , _, Bpl , Bp2) :- % no conj relation but more than 1 bodyloc 
Rel = [rel, Conj |_] , Bp2 \= [] , 
mergemods ( [Bpl] , [Bp2] ,Conjargs) , 
f rame (F, rel, Conj , Conj args) . 

getrelation (R, Fl , F2 , F) : - 
(F2 \o [], 

(Fl = [rel, Conj 1 |Restl] , R = [rel, Conj], 

(Conjl = ','; Conjl = or; Conjl = and), 
(Conj = Conj = or; Conj = and); 

Restl = [Fl] ) , 
(F2 = [rel, Conj 2 |Rest2] , 

(Conj 2 = • ,'; Conj 2 = or,* Conj 2 = and); 

Rest2 = [F2] ) , 
%splice ( [R, Restl , Rest2] , F) ; 
append ( [R, Restl , Rest2] ,F) ; 
F2 = [] , F = Fl ) . 



uptotal : - 

addstotal (X) , 

X =< 50, 

NewX is X + 1, 

retractall (addstotal (X) ) , 

assert (addstotal (NewX) ) , 
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$save{ 1 a ' 
$save{ 'b ! 
$save{ ' c ' 
$save{ 'd' 
$save{ ' e 1 
$save{ ' f ' 
$save{ *g • 
$save{ 'h' 
$save{ ' i ' 
$save{ ' j ' 
$save{ 'k' 
$save{ ' 1 ' 
$save{ 'm' 
$save{ ' n ■ 
$save{ ' o' y 
$save{ 'p • } 
$save { 
$save{ 
$save{ 
$save{ 
$save{ ' 
$save{ 1 
$save{ ■ 
$save{ * x 
$save{ ' y ' 
$save{ 1 z ' 
$save{ ' 0 1 
$save{ ' 1 ' 
$save{ '2 ' 
$save{ '3' 
$save{ 1 4 ' 
$save{ • 5' 
$save{ 1 6 ' 
$save{ ' 7 ' 
$save{ ' 8 ' 
$save{ ' 9 ' 
$save{' ' 
$save{ • ] ■ 
$save{ ' [ ' 
$save{ ' ; » 
$save{ ' i ' j — 
$save{ • " ' } = 
$save{ ' \ ' ' } 
Ssavej 1 ? ' } = 
$save{ 1 ! • } = 
$save{ ' #' }= 
$save{ ' $ ' } = 
$save{ ' A » * 
$save{ • &' 
$save{ • * 1 
$save{ ' ( 1 j — 
$save{ 1 ) ' }= 



= ' AAAC 
= 1 AAAG 
= ' AAAT 
: 'AACC 
: ' AACG 

■ 1 AACT 
: ' AAGC 

■ ' AAGG ' 
: ' AAGT ' 

' AATC ' 
' AATG ' 

' ACAC 1 
1 ACAG ' 
' ACAT ' 
' ACCC 1 
' ACCG * 
1 ACCT 1 
• ACGC ' 
■ ACGG ' 

* ACGT » 
• ACTC » 
■ ACTG ' 
• ACTT ' 
•AGAG' 
' AGAT > 
■ AGCC 1 
' AGCG ' 
■ AGCT ' 
' AGGC ' 

* AGGG ' 
' AGGT ' 
' AGTC ■ 
• AGTG ' 
1 AGTT ' 
' ATAT * 
' ATCC ' 
1 ATCC ' 
' ATCC ' 

* ATCC » 
' ATCC ' 
' ATCC * 
= 1 ATTC 
' ATCC ' 

' ATCC ' 
1 CCCG ' 
» CCCT ' 
1 CCGG » 
' CCGT ' 
CCTG » 
ATCC ' 
ATCC 1 
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A ppendix . p 

# ! /usr/bin/perl 
#Scan.pl : Scans blast output 
#Author: Michael Krauthammer 
#Copyright: c.1999, Columbia University 

#Variables 

#blast input/file 
$input_f ile="genebank. result" ; 
ttprogram output 
$output_file= "match. txt" ; 

#open datastream for file which contains blast output 

open (INPUT, ' /storage/psi -blast/Marklt/programs/marklt . result ' ) / 

while ($line=<INPUT>) { 

if ($line=~/\>gi\| (\d*) (.*) \ , (.*) \ ,(.*)/) { 
$ target = $4;^ = - = . . _ _ 
$gi =$1; 

$semantic_class=$3 ; 
} 

if ($line=~/Length = (.*)/){ 
$lengthl=$l; 
} 

if ($line=~/Identities \= (\d*)\//){ 
$length_actual=$l 

} 

if ($line=-/Query: (\d*)/){ 
$start=$l ; 
} 

#print if Subj 1, sometimes match 2 or 3 line long 

if ($line=~/Sbjct : 1 /) { 
if ( ($length__actual/$lengthl) > .9){ 
print 

$target, " | ", $start, " | " , $start+$lengthl , » | " , $semantic_class , " | ", $gi, "\n»; 
} 
} 
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Appendix (q 

# ! /usr/bin/perl 

#nucleot ide_text_parser.pl 

#Author: Michael Krauthammer, c.1999 Columbia University 
open ( INPUT , $ ARGV [ 0 ] ) ; 

#read uncoded input text line by line (chop it) 
$all="; 

while ($line=<INPUT>) { 
$all=$all.$line; 

} 

open (INPUTII, ' /storage/psi-blast/Marklt/programs/markltll . result ■ ) ; 
open (OUTPUT, ' >result . txt 1 ) ; 

#first part: check matches, store positions 1 
wh i 1 e ( $ I i ne = < INPUT! I > ) { 

! 

($name, $start , $end, $semantic_class , $gi) =$line=~/ { . * ) \ | ( . * ) \ | ( . * ) \ | ( . * ) \ | ( . * ) / 

#divide by 4 (4 letter code) 
$start= ($start-l) /4 ; 
$end= ($end-l) /4; 

#get substring 
if ($start != 0) { 

$letters = substr ($all, $start-l , $end-$start+3 ) . n | "; 
} else { 

$letters = ' ' . substr ($all , 0 , $end+2 ) . " I " ; 

} 

($letter_beginning) =$letters=-/ ) /; 
$letter_end=substr ($all, $end, 1) ; 
$letter_endll = substr ($all , $end, 2 ) ; 

#ignore matches that are in the MIDDLE of sentences, allow plurals 
$letter_beginning=-tr/ [A-Z] / [a-z] / ; 
$letter_end=-tr/ [A-Z] / [a-z] /; 

if ( ( ! ($letter_beginning=~/ [a-z] /) ) && (.( ! ( $letter_end=~/ [a- z] / ) ) || 
($letter_endll=~/s /))){ 

#make sure only the first occurence is stored at this position 

if ($save{$start }=='■) { j 

$save{$start}=$end. ' | * . $semantic_class . 1 | 1 .$gi; 

} 

foreach $key (keys (%save) ) { 
($end_key) =$save { $key) ( - *) \ | /; 
if ($end_key>$end) { 
if ($key<$start) { 

$save{$start}= 'null • , 

} 

} 

} 

} 
} 
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#second part: print out marked up document 
sort (%save) ,* 

for ($i=0;$i<length($all) ;$i++) { 

if ( ( !$save{$i}=='null' ) && ($save{$i}=~/ . /) ) { 
($end, $semantic_class) =$save{ $i } =-/ ( . *) \ | ( . *) \ | / 
print OUTPUT ■ <phr= » ■ , $semantic_class , ' » > • ; 
$store=substr ($311, $i, $end-$i) ; 
print OUTPUT $store; 
print OUTPUT "</phr>"; 
$i=$end-l; 

} else { 
$store=substr ($all, $i, l) ; 
print OUTPUT $ store; 

} 

) 
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